Tfidf_count.py 文件源码

python
阅读 21 收藏 0 点赞 0 评论 0

项目:Graduation-design 作者: Baichenjia 项目源码 文件源码
def read_test_list():
    """Return the selected words of the Weibo corpus as one string.

    Reads the hard-coded corpus file line by line, segments each stripped
    line with ``pseg.cut`` and keeps only the tokens whose ``flag`` is one
    of ``n``, ``nr``, ``ns``, ``nt`` or ``nz`` (presumably the noun-family
    part-of-speech tags of the segmenter; ``pseg`` is imported outside this
    function -- confirm against the file's imports).

    Returns:
        The kept words, in file order, joined by single spaces. An empty
        string when no token matches.

    Raises:
        IOError / OSError: if the corpus file cannot be opened.
        UnicodeDecodeError: if the file content is not valid UTF-8.
    """
    # Function-scope import: ``io.open`` accepts ``encoding`` on both
    # Python 2 and Python 3, so the text is decoded once at the I/O boundary
    # instead of calling ``.decode`` per line and discarding the result.
    import io

    wanted_flags = ('n', 'nr', 'ns', 'nt', 'nz')
    contents = []
    # ``with`` guarantees the file is closed even if segmentation raises.
    with io.open("f://emotion/mysite/weibo_crawler/chinese_weibo.txt", 'r',
                 encoding='utf-8') as fp:
        for line in fp:  # stream lines instead of loading the whole file
            for token in pseg.cut(line.strip()):
                if token.flag in wanted_flags:
                    contents.append(token.word)

    # Merge the collected words into a single space-separated string.
    return ' '.join(contents)


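# 5. TF-IDF over the words from chinese_weibo.txt, keeping the top 100 (the original non-ASCII comment was lost to mis-encoding; wording reconstructed -- verify)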
评论列表
文章目录


问题


面经


文章

微信
公众号

扫码关注公众号