def get_seg_features(string):
    """
    Segment text with jieba and return one BIES-style tag per character.

    Each word yielded by ``jieba.cut(string)`` contributes ``len(word)``
    integer tags:

    * ``0`` -- S: the word is a single character
    * ``1`` -- B: first character of a multi-character word
    * ``2`` -- I: interior character of a multi-character word
    * ``3`` -- E: last character of a multi-character word

    :param string: the text to segment (passed straight to ``jieba.cut``)
    :return: flat list of integer tags, in the order the words are yielded
    """
    seg_feature = []
    for word in jieba.cut(string):
        if len(word) == 1:
            # Single-character word -> S
            seg_feature.append(0)
        else:
            # Start with all-interior tags, then overwrite both ends.
            # For a two-character word this yields [1, 3].
            tmp = [2] * len(word)
            tmp[0] = 1
            tmp[-1] = 3
            # extend (not append) so the result stays a flat list with
            # one tag per character rather than a list of per-word lists.
            seg_feature.extend(tmp)
    return seg_feature
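# Source: data_utils.py (Python), copied from a code-sharing web page.
# Page metadata at time of capture: views 26, favorites 0, likes 0, comments 0.
# (Trailing page navigation: "comment list", "table of contents".)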