初学望批评指正。
带背景图的《红楼梦》词云。
原始图像:


最终用 PS 合成的图。其实挺唏嘘的,一般人认为黛玉是绝对的女主,但是黛玉只出现了900多次,不及贾母的3000次、凤姐的1000次。
这个是人物出场次数统计:

这个是我的另一个帖子, 红楼梦人物出场统计
最终的成片。抠图毕竟简陋。

源代码如下:
#GovRptWordCloudv1.py
import jieba
import wordcloud
import imageio
# Alias -> canonical character name, so that every way of addressing a
# character is counted under one entry.
# NOTE(review): "太太" and "老爷" are generic forms of address and may refer
# to other characters in the novel; the mapping is kept exactly as the
# original script had it -- confirm it matches the intended statistics.
NAME_ALIASES = {
    "老太太": "贾母",
    "太太": "贾母",
    "老祖宗": "贾母",
    "史太君": "贾母",
    "老爷": "贾政",
    "宝二爷": "宝玉",
    "王熙凤": "凤姐",
    "熙凤": "凤姐",
    "凤辣子": "凤姐",
    "林黛玉": "黛玉",
    "潇湘妃子": "黛玉",
    "林丫头": "黛玉",
    "林妹妹": "黛玉",
    "宝姑娘": "宝钗",
    "宝丫头": "宝钗",
    "蘅芜君": "宝钗",
    "宝姐姐": "宝钗",
}


def count_words(words):
    """Count tokens, merging character aliases into one canonical name.

    Args:
        words: Iterable of string tokens (e.g. the list returned by
            ``jieba.lcut``).

    Returns:
        A dict mapping each kept token (aliases already replaced by their
        canonical name) to its number of occurrences. Single-character
        tokens and tokens containing no letter or digit are left out.
    """
    counts = {}
    for word in words:
        if len(word) < 2:
            continue
        # The counts are handed to the word cloud verbatim, without the
        # library's own tokenizer in between, so tokens made only of
        # punctuation or whitespace have to be dropped here.
        if not any(ch.isalnum() for ch in word):
            continue
        name = NAME_ALIASES.get(word, word)
        counts[name] = counts.get(name, 0) + 1
    return counts


def main():
    """Render a masked word cloud of dreams01.txt to grwordcloud4.png."""
    mask = imageio.imread("01.jpg")
    with open("dreams01.txt", "r", encoding="utf-8") as f:
        text = f.read()

    counts = count_words(jieba.lcut(text))

    # Per the wordcloud documentation, width/height are ignored when a mask
    # is supplied (the mask's shape is used); they are kept as in the
    # original call.
    cloud = wordcloud.WordCloud(
        font_path="msyh.ttc",
        mask=mask,
        width=1000,
        height=700,
        background_color="white",
    )
    # Build the cloud from the merged counts. Generating from the raw token
    # text would ignore the alias merging done in count_words().
    cloud.generate_from_frequencies(counts)
    cloud.to_file("grwordcloud4.png")


if __name__ == "__main__":
    main()