def __init__(self, document):
    """Set up tokenisation state from a document mapping.

    Reads ``document['body']`` and ``document['head']``. The body is
    stored verbatim and also split into sentences with
    ``nltk.sent_tokenize``. A ``RegexpTokenizer`` is built from the
    ``pattern`` attribute of a fresh ``settings.Settings()`` instance;
    it is only constructed here, not applied to the text.

    Attributes set:
        settings: the ``settings.Settings()`` instance.
        tokeniser: ``RegexpTokenizer`` built from ``settings.pattern``.
        text: the value of ``document['body']``.
        sentences: result of ``nltk.sent_tokenize`` on the body.
        event: the value of ``document['head']``.
    """
    # Configuration first: the tokeniser depends on its pattern.
    config = settings.Settings()
    self.settings = config
    self.tokeniser = RegexpTokenizer(config.pattern)

    # Keep the raw body alongside its sentence-level split.
    body = document['body']
    self.text = body
    self.sentences = nltk.sent_tokenize(body)

    # NOTE(review): 'head' is stored under the name "event" — presumably
    # the headline identifies the event; confirm against the caller.
    self.event = document['head']
评论列表
文章目录