def get_tfidf(documents):
    """Compute dense TF-IDF vectors for ``documents`` using gensim.

    Each document's ``text`` attribute is split on whitespace into tokens,
    a gensim ``Dictionary`` is built over all tokens, and a ``TfidfModel``
    fitted on the resulting bag-of-words corpus is applied back to it.

    Args:
        documents: Iterable of objects exposing a ``text`` string attribute.

    Returns:
        A list with one entry per document. Each entry is a list of length
        ``len(dictionary)`` in which position ``i`` holds the TF-IDF weight
        of the token with dictionary id ``i``; positions for tokens that do
        not appear in the document's TF-IDF output are left as ``0``.
    """
    # str.split() already returns a fresh list of tokens per document.
    tokenized = [document.text.split() for document in documents]
    dictionary = corpora.Dictionary(tokenized)
    n_items = len(dictionary)
    corpus = [dictionary.doc2bow(tokens) for tokens in tokenized]
    tfidf = models.TfidfModel(corpus)

    ds = []
    # The model yields sparse (token_id, weight) pairs; expand each document
    # into a fixed-width dense row so every row has the same length.
    for doc in tfidf[corpus]:
        d = [0] * n_items
        for index, value in doc:
            d[index] = value
        ds.append(d)
    return ds
kmeans_cluster.py 文件源码
python
阅读 21
收藏 0
点赞 0
评论 0
评论列表
文章目录