import jieba
from wordcloud import WordCloud
import matplotlib.pyplot as plt
# AI2017.txt comes from http://www.gov.cn/zhengce/content/2017-07/20/content_5211996.htm
# Read the whole document into memory. The encoding is passed explicitly so
# that decoding does not depend on the platform's default codec;
# "utf-8-sig" reads plain UTF-8 and also skips a leading BOM if present.
# NOTE(review): assumes AI2017.txt and stopword.txt are UTF-8 encoded -- confirm.
with open('AI2017.txt', 'r', encoding='utf-8-sig') as f:
    renmin = f.read()

jieba.load_userdict("AIDict.txt")  # register the custom user dictionary
seg_list = jieba.cut(renmin, cut_all=False)  # segment the text into words

# Term frequencies: segment -> number of occurrences in the document.
tf = {}
for seg in seg_list:
    tf[seg] = tf.get(seg, 0) + 1

with open('stopword.txt', 'r', encoding='utf-8-sig') as ft:
    stopword = ft.read()

# Match segments against whole stop-word entries. Testing `seg in stopword`
# on the raw text is a substring search, which also discards any segment
# that merely happens to be part of a longer stop word.
# NOTE(review): assumes stopword.txt holds one stop word per line -- confirm.
stopword_set = {line.strip() for line in stopword.splitlines() if line.strip()}

# Iterate over a snapshot of the keys so entries can be removed from tf
# while looping.
ci = list(tf.keys())
for seg in ci:
    # Drop segments seen fewer than 5 times, segments shorter than 2
    # characters, stop words, and anything containing the character '一'.
    if tf[seg] < 5 or len(seg) < 2 or seg in stopword_set or '一' in seg:
        tf.pop(seg)
#统计词频后绘制词云图
f