问题描述:
rword用法,举个简单的例子,不要复杂。
问题解答:
当需要将一组特定的词汇归一化为一个标准的词汇时,可以用一个变量(这里命名为 rword)来保存替换后的词。
rword 只是一个普通的变量名,并不是 Python 的关键字或内置函数。
# Minimal example: `rword` is an ordinary variable that holds the normalized
# ("replacement") form of `word`; `word` itself is never modified.
word = "姑娘"
# If word equals "姑娘", use "女士" in its place; otherwise keep word as is.
if word == "姑娘":
    rword = "女士"
else:
    rword = word
print(rword)  # prints "女士"
——————————————————————————————————————
word 本身没有被修改,只不过在统计词频的时候,计数用的键是归一化之后的 rword。
# Count word frequencies, folding variant forms of a word into one canonical
# form before counting.
# NOTE(review): `txt0` is defined elsewhere; this code only requires it to be
# an iterable of strings (presumably segmented words -- confirm at the caller).

# Lookup table: variant form -> canonical form it is counted under.
# Words that do not appear here are counted under their own spelling.
ALIASES = {
    '凤姐儿': '凤姐',
    '凤丫头': '凤姐',
    '二爷': '宝玉',
    '宝二爷': '宝玉',
    '颦儿': '黛玉',
    '林妹妹': '黛玉',
    '黛玉道': '黛玉',
    '宝丫头': '宝钗',
    '老祖宗': '贾母',
    '袭人道': '袭人',
    '贾政道': '贾政',
    '琏二爷': '贾琏',
}

counts = {}
for word in txt0:
    # Single-character tokens are skipped and never counted.
    if len(word) == 1:
        continue
    # `word` is left untouched; only the normalized `rword` is used as the key.
    rword = ALIASES.get(word, word)
    counts[rword] = counts.get(rword, 0) + 1

# (word, count) pairs ordered by count, highest first. The sort is stable, so
# words with equal counts keep their first-seen order.
li = sorted(counts.items(), key=lambda x: x[1], reverse=True)
print(li)