def bag_of_words(messages, model=None, weighting=''):
    """Convert text messages into a bag-of-words feature matrix.

    The messages are first passed through
    ``texttools.stemming_messages_snowball``; only the first element of the
    pair it returns (the processed messages) is used for feature extraction.

    Args:
        messages: Collection of text messages to vectorize.
        model: Vectorizer exposing ``transform``. When given, it is used
            as-is and is not (re-)fitted here, so it must already be fitted.
            When ``None``, a new vectorizer is created and fitted on
            ``messages``.
        weighting: ``'tfidf'`` selects ``TfidfVectorizer`` for a newly
            created model; any other value selects ``CountVectorizer``.
            Has no effect when ``model`` is supplied.

    Returns:
        The feature matrix the vectorizer produces for ``messages``
        (presumably a sparse document-term matrix if these are the
        scikit-learn vectorizers -- confirm against the file's imports).
    """
    # TODO: Add stemming or baseform here
    # The second returned value (named ``stemmings2baseform`` in the original
    # code) is not needed for feature extraction, so it is discarded.
    messages, _ = texttools.stemming_messages_snowball(messages)

    if model is not None:
        # Reuse the caller's vectorizer unchanged so the features line up
        # with whatever it was fitted on.
        return model.transform(messages)

    # No model supplied: build one according to the requested weighting.
    model = TfidfVectorizer() if weighting == 'tfidf' else CountVectorizer()

    # fit_transform() is equivalent to fit() followed by transform(), but
    # processes the messages only once.
    return model.fit_transform(messages)
textfeatures.py 文件源码
python
阅读 33
收藏 0
点赞 0
评论 0
评论列表
文章目录