def extract_org(sent):
    """Collect the leaves of organization and geo-political entity chunks.

    The sentence is word-tokenized, part-of-speech tagged, and run through
    NLTK's named-entity chunker with ``binary=False`` so that chunks carry
    their specific entity label rather than a generic one.

    Note that, despite the function name, chunks labelled ``GPE`` are
    collected alongside those labelled ``ORGANIZATION``.

    Args:
        sent: The sentence text to analyse.

    Returns:
        A flat list of the leaves of every matching chunk, in the order the
        chunk tree yields them. The leaves are the items of the tagged token
        list handed to the chunker (with NLTK's ``pos_tag`` these are
        ``(token, tag)`` pairs), not bare strings. The list is empty when no
        matching chunk is found.
    """
    tagged = pos_tag(nltk.tokenize.word_tokenize(sent))
    tree = nltk.ne_chunk(tagged, binary=False)

    wanted_labels = ('GPE', 'ORGANIZATION')
    org = []
    for subtree in tree.subtrees(filter=lambda t: t.label() in wanted_labels):
        # A multi-word entity contributes one entry per token.
        org.extend(subtree.leaves())
    return org
评论列表
文章目录