一、词云图中的错误
1、生成词云图的源代码
import jieba
import matplotlib.pyplot as plt
import numpy as np
from PIL import Image
from wordcloud import WordCloud,STOPWORDS
def cloudchart():
    """Generate a word cloud from ``text.txt``, save it and display it.

    The function reads the GBK-encoded file ``text.txt``, segments it with
    jieba, renders a word cloud shaped by the mask image ``R-C.png`` and
    writes the result to ``cyt1.png`` before showing it in a matplotlib
    window.  It takes no arguments and returns ``None``.

    Raises:
        FileNotFoundError: if ``text.txt`` or ``R-C.png`` does not exist.
        UnicodeDecodeError: if ``text.txt`` is not valid GBK text.
    """
    # Use a context manager so the file handle is closed even on error.
    with open('text.txt', 'r', encoding="gbk") as file:
        raw_text = file.read()

    # The segmented words must be joined with a space: with an empty
    # separator the words are glued back together, and the resulting cloud
    # shows bar-like artifacts and sizes that do not follow word frequency.
    txt = ' '.join(jieba.cut(raw_text))

    # Convert the image to an array while the file is still open, then
    # release the image handle.
    with Image.open(r'R-C.png') as image1:
        MASK = np.array(image1)

    # Words that should not appear in the cloud.
    stopwords = set(STOPWORDS) | {'四', '六', '五', '的', '与', '和', '等'}

    # Background colour, canvas size and word limits of the cloud.
    # NOTE(review): per the wordcloud documentation, width/height are
    # ignored when a mask is supplied -- confirm and drop them if unneeded.
    wordcloud = WordCloud(
        font_path=r'simhei.ttf',
        background_color="white",
        height=200,
        width=150,
        mask=MASK,
        stopwords=stopwords,
        max_font_size=120,
        max_words=100,
    ).generate(txt)
    wordcloud.to_file("cyt1.png")

    plt.imshow(wordcloud)
    # Hide the x and y axes.
    plt.axis('off')
    plt.show()
# Run the word-cloud generation only when executed as a script.
if __name__ == "__main__":
    cloudchart()
2、 出现的错误
如果 join 方法的分隔符 ' ' 中没有空格(即写成空字符串 ''),如下所示:
txt = ''.join(res)
词云图中会出现一些条状物,并且生成的词的大小不是按照出现频率的高低来决定的。这是因为 WordCloud 依靠空格和标点来区分词语,去掉空格后,分好的词又被拼接成了很长的字符串,无法正确统计词频。
加入空格以后: