用文件内容生成词云时,遇到中文文本的处理办法:
# -*- coding: utf-8 -*-
from wordcloud import WordCloud
import PIL .Image as image
import numpy as np
import jieba
def trans_CN(text: str) -> str:
    """Segment Chinese text and return the words separated by spaces.

    Args:
        text: The raw text to segment.

    Returns:
        A single string in which the segments produced by ``jieba.cut``
        are joined with one space between each pair.
    """
    word_list = jieba.cut(text)
    # After segmentation, put a space between the individual tokens.
    result = " ".join(word_list)
    return result
# Read the whole source document. A raw string keeps the Windows backslashes
# literal. No encoding is passed, so the platform default applies.
# NOTE(review): confirm the file's encoding matches that default.
with open(r"D:\yxl\yicun\lunwen.txt") as fp:
    text = fp.read()

# Insert spaces between the segmented words before building the cloud.
text = trans_CN(text)
print(text)

# Optional shape mask, currently disabled:
# mask = np.array(image.open(r"D:\yxl\yicun\heart11.png"))

# font_path selects a Chinese font (SimHei) so the Chinese words render.
wordcloud = WordCloud(font_path="./fonts/simhei.ttf").generate(text)
image_produce = wordcloud.to_image()
image_produce.show()
关键是在 WordCloud() 的参数中添加 font_path='./fonts/simhei.ttf',即把字体设置为中文字体。