def snowball(inputpath=None, text=None):
    """
    Stem text with the English Snowball stemmer.

    Two modes, checked in this order:

    * ``inputpath`` is truthy: every regular file directly inside that
      directory is read, its content is split on commas, and each piece is
      stemmed. The stems of all files are returned as one flat list.
      Pieces are stemmed exactly as split (surrounding whitespace is not
      stripped).
    * otherwise, ``text`` is truthy: ``text`` is handed to the stemmer as a
      single token and the resulting stem is returned.

    :param inputpath: directory whose files hold comma-separated tokens.
    :param text: a single token to stem; ignored when ``inputpath`` is set.
    :return: a list of stems (directory mode), a single stem (text mode),
        or ``None`` when neither argument is truthy.
    """
    sb = SnowballStemmer('english')

    if inputpath:
        sbstemmed_list = []
        for name in os.listdir(inputpath):
            filepath = os.path.join(inputpath, name)
            # os.listdir also yields sub-directories; open() would raise on
            # them, so only regular files are processed.
            if not os.path.isfile(filepath):
                continue
            with open(filepath, 'r') as f:
                data = f.read()
            # Skip empty files: ''.split(',') yields [''] and that empty
            # piece would otherwise be stemmed and added to the result.
            if data:
                # 'token' rather than 'text' so the parameter is not shadowed.
                sbstemmed_list.extend(sb.stem(token) for token in data.split(','))
        return sbstemmed_list

    if text:
        return sb.stem(text)

    # Neither argument supplied: make the "nothing to do" result explicit.
    return None
stemming.py 文件源码
python
阅读 23
收藏 0
点赞 0
评论 0
评论列表
文章目录