def __init__(self):
    """Set up the NLTK-backed helpers stored on this instance.

    Requests the 'stopwords', 'wordnet' and 'punkt' corpora through
    ``install_nltk_corpora``, then populates the ``lemmatizer``,
    ``tokenizer``, ``stopwords`` and ``sent_tokenizer`` attributes.
    """
    required_corpora = ('stopwords', 'wordnet', 'punkt')
    self.install_nltk_corpora(*required_corpora)

    self.lemmatizer = nltk.WordNetLemmatizer()
    # Throwaway call on an empty string: nudges nltk's lazy corpus loader
    # into doing its work now; the result is intentionally discarded.
    self.lemmatizer.lemmatize('')

    self.tokenizer = self.make_tokenizer()

    english_stopwords = nltk.corpus.stopwords.words('english')
    self.stopwords = english_stopwords

    # Starts out unset. NOTE(review): presumably created on demand
    # elsewhere in the class -- confirm against the code that uses it.
    self.sent_tokenizer = None
评论列表
文章目录