# Python 文章高频词分析总结：自己做的笔记，仅供大家学习参考。
import jieba
from collections import Counter
# Report the most frequent multi-character words in "词频文档.txt".
#
# The document is read as UTF-8, segmented into words with jieba, counted,
# and the top-ranked words are printed one per line as "<word> <count>".

# Number of top-ranked words to print. The closing summary message is built
# from this same value so the reported figure always matches the output
# (the original looped over 200 entries but announced 100).
TOP_N = 200

# Read the whole file up front so the handle is closed before the
# segmentation work starts.
with open("词频文档.txt", "r", encoding="utf-8") as f:
    text = f.read()

# jieba.lcut returns the segmented tokens as a list.
words = jieba.lcut(text)

# Keep only tokens longer than one character (presumably to drop punctuation
# and single-character particles -- confirm this matches the intended filter).
counts = Counter(word for word in words if len(word) > 1)

# most_common yields (word, count) pairs ordered from most to least frequent.
for word, count in counts.most_common(TOP_N):
    print(word, count)

# One-time summary printed after the listing.
print(f'已统计数量排前{TOP_N}的词')