def pretreatment(text=None):
    """Lower-case a sentence, replace punctuation with spaces, and split it.

    Each resulting word is printed on its own line before the list is
    returned.

    Args:
        text: Sentence to tokenize. When omitted (``None``), the built-in
            sample sentence is used, so the zero-argument call keeps working.

    Returns:
        The lower-cased, whitespace-separated words in their original order.
    """
    if text is None:
        text = 'We need to use window.load, not document.ready, because in Chrome'

    # Strings are immutable: str.replace returns a new string, so calling it
    # without keeping the result leaves the punctuation in place. A single
    # translate pass maps every listed symbol to a space instead.
    punctuation = ",.!、!@#$%^'"
    to_space = str.maketrans(dict.fromkeys(punctuation, ' '))

    words = text.lower().translate(to_space).split()
    for word in words:
        print(word)
    return words
def main():
    """Count the words returned by pretreatment() and print three list views.

    Printed, in order: the (word, count) pairs, the "word:count" strings,
    and the bare words. The pair list is then sorted by count, descending.
    """
    counts = {}
    for token in pretreatment():
        # First sighting starts the tally at one; later sightings add one.
        if token in counts:
            counts[token] += 1
        else:
            counts[token] = 1

    # Three ways of turning the dictionary into a list:
    pairs = [(token, total) for token, total in counts.items()]
    labels = [f"{token}:{total}" for token, total in counts.items()]
    keys = [token for token in counts]

    print(pairs)
    print(labels)
    print(keys)

    pairs.sort(key=lambda pair: pair[1], reverse=True)
    # Printing the top 2 entries is currently disabled:
    # for word, count in pairs[:2]:
    #     print('{0:<20}{1:>10}'.format(word, count))
# Run the word count only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
# 运行结果 (program output):