def getText(file):
    """Read a UTF-8 text file and return its lines cleaned for word counting.

    Every character in the special-character set below (punctuation plus the
    newline) is replaced by a single space, and each line is lower-cased, so
    that calling ``str.split()`` on a returned line yields its words.

    Args:
        file: Path of the text file to read.

    Returns:
        A list with one cleaned string per line of the file, in file order.

    Raises:
        OSError: If the file cannot be opened (propagated from ``open``).
        UnicodeDecodeError: If the file content is not valid UTF-8.
    """
    # Same character set as before; each one is mapped to a space in a
    # single translate pass instead of one replace() call per character.
    specials = '!"#$%&()*+,-./:;<=>?@[\\]^_‘{|}~\n'
    to_space = str.maketrans(specials, ' ' * len(specials))

    with open(file, 'r', encoding='UTF-8') as txt:
        # Build a new list of cleaned lines. The previous loop only rebound
        # its loop variable, so the cleaned text was thrown away and the raw
        # lines were returned unchanged.
        return [line.translate(to_space).lower() for line in txt]
for i in range(10):
try:#试错,防止异常退出
file = input("请输入文件名(不带后缀):")+'.txt'#输入文件名
TEXT = getText(file)#进行前处理
d = {}#建立空字典
for strs in TEXT:#此时strs为每行的长字符串
words = strs.split()#将长字符串分割,split后为列表
for word in words:#遍历列表,进行计数
d[word] = d.get(word, 0) + 1#get函数,如果存在,就+1,不存在就设为1.
item = list(d.items())#转为字典,方便排序
item.sort(key=
def getText(file): with open(file, 'r', encoding='UTF-8') as txt: #打开文件 txt = txt.readlines()#,以readlines模式,每个字符为一个行“伪字符串” for line in txt: for ch in '!"#$%&()*+,-...