用WordCloud库生成中英文词云
思路:
1、确定需要生成词云的样本(字符串类型)
2、设置词云格式并获取样本生成词云
英文词云:
import wordcloud as wc
def Get_txt(path="hamlet.txt"):
    """Read a UTF-8 text file and blank out punctuation.

    Args:
        path: File to read. Defaults to "hamlet.txt" in the working
            directory, which is what the original script used.

    Returns:
        The file contents with every character of the punctuation set
        below replaced by a single space.
    """
    punctuation = '''!"#$&()*+,-./:;<=>?@[\\]^_‘'{|}'~'''
    # The context manager guarantees the handle is closed, even if the
    # read raises.
    with open(path, "r", encoding="utf-8") as source:
        txt = source.read()
    # One translate() pass replaces every listed character with a space,
    # instead of rescanning the whole text once per character.
    return txt.translate({ord(ch): " " for ch in punctuation})
def Work(txt, out_path=r"D:\wordcloud\wc.png"):
    """Render a word cloud from *txt* and save it as an image file.

    Args:
        txt: Text the word cloud is generated from.
        out_path: Destination image path. Defaults to the location the
            original script wrote to.
    """
    # Configure a 500x500 cloud with font_step=2. The path default is a raw
    # string so the backslashes are not treated as escape sequences.
    w = wc.WordCloud(height=500, width=500, font_step=2)
    w.generate(txt)
    w.to_file(out_path)
def main():
    """Build the English word cloud: load the cleaned text and render it."""
    Work(Get_txt())


main()
中文词云:
import wordcloud as wc
import jieba
# Words to drop from the text before the word cloud is generated.
exinclude = [
    "的",
    "是",
    "和",
    "在",
]
def Out(ls, path=r"D:\python\output\关于实施乡村振兴战略的意见.txt"):
    """Write *ls* to a UTF-8 text file using print() formatting.

    Args:
        ls: Object to write; it is rendered exactly as print() would
            render it, followed by a newline.
        path: Destination file. Defaults to the location the original
            script wrote to (raw string, so backslashes stay literal).
    """
    # The original referenced `data.close` without calling it, so the file
    # was never explicitly closed; the context manager closes it reliably.
    with open(path, "w", encoding="utf-8") as data:
        print(ls, file=data)
def main():
    """Segment the Chinese source document and render its word cloud.

    Reads the input text, splits it into words with jieba, writes the
    space-joined words through Out(), removes the stop words listed in
    ``exinclude``, then generates the word cloud and saves it as a PNG.
    """
    # Raw strings keep the Windows backslashes literal; the context manager
    # closes the input file once it has been read.
    with open(r"D:\python\input\关于实施乡村振兴战略的意见.txt", "r", encoding="utf-8") as source:
        f = source.read()
    ls = jieba.lcut(f)  # jieba segmentation, returns a list of words
    Out(" ".join(ls))  # dump the full, unfiltered segmentation
    # Drop stop words as whole tokens. A substring replace on the joined
    # text would also cut these characters out of longer words
    # (e.g. "和平" or "存在") and corrupt them.
    kept = [word for word in ls if word not in exinclude]
    txt = " ".join(kept)
    w = wc.WordCloud(
        height=1000,
        width=700,
        font_step=2,
        font_path="msyh.ttc",
        background_color="white",
    )
    w.generate(txt)
    w.to_file(r"D:\python\output\关于实施乡村振兴战略的意见.png")


main()