def tokenize(sentence):
    """Tokenize sentence the way parser expects.

    The sentence is split with ``TreebankWordTokenizer``, the resulting
    tokens are joined back together with single spaces, and then every
    character of that string is looked up in ``REPLACEMENTS_R``:
    characters with an entry are swapped for the mapped value, all
    others are kept as they are.

    Args:
        sentence: The raw text to tokenize.

    Returns:
        The space-separated token string after character replacement.
    """
    words = TreebankWordTokenizer().tokenize(sentence)
    spaced = ' '.join(words)
    # Character replacements: the lookup is per character of the joined
    # string (spaces included), not per token.
    pieces = [REPLACEMENTS_R.get(ch, ch) for ch in spaced]
    return ''.join(pieces)
评论列表
文章目录