# jieba official documentation: https://github.com/fxsjy/jieba
# encoding=utf-8
import jieba
import jieba.analyse
# Read 'Chinese.txt' line by line and run jieba on each line.
# NOTE(review): the file is opened without an explicit encoding, and no
# close() is visible in this portion of the script -- confirm how the
# handle is released and which encoding the input file uses.
txt = open('Chinese.txt',"r")
# Starts empty; presumably collects the per-line results (the code that
# fills it is not in the visible lines -- verify further down).
seg_txt=[]
# NOTE(review): the loop body below is not indented in this copy of the
# script; the indentation appears to have been lost and must be restored
# before the script can run.
for line in txt:
# Three alternative statements for processing a line; only the first is active.
# The first statement performs keyword extraction.
# The second statement performs word segmentation.
# The third statement performs keyword extraction (with a different algorithm from the first).
# Strip newline, carriage-return and tab characters from both ends of the
# line before passing it to jieba's keyword extractor.
seg_list = jieba.analyse.extract_tags(line.strip('\n\r\t'))
#seg_list = jieba.lcut(line.strip('\n\r\t'))
#se