题目描述
问题1
import jieba
# Problem 1: segment the text of data.txt with jieba and write every distinct
# word of three or more characters to out1.txt, one word per line, in the
# order the words first appear.
# NOTE(review): both files are opened with the platform default encoding, as
# in the original script; confirm data.txt's encoding before pinning one.
with open('data.txt', 'r') as f:
    datas = f.read()
data = jieba.lcut(datas)

seen = set()  # O(1) membership test; scanning the result list was O(n) per word
d = []        # distinct qualifying words, in first-seen order
for i in data:
    if len(i) >= 3 and i not in seen:
        seen.add(i)
        d.append(i)

# The context manager closes out1.txt even if a write raises.
with open("out1.txt", "w") as fi:
    fi.writelines(word + "\n" for word in d)
问题2
import jieba
# Problem 2: segment the text of data.txt with jieba, count how often each
# word of three or more characters occurs, and write "word:count" lines to
# out2.txt sorted by count from highest to lowest.
# NOTE(review): both files are opened with the platform default encoding, as
# in the original script; confirm data.txt's encoding before pinning one.
with open("data.txt", "r") as f:
    datas = f.read()
data = jieba.lcut(datas)

d = {}
for i in data:
    if len(i) >= 3:
        d[i] = d.get(i, 0) + 1

# sorted() is stable even with reverse=True, so words with equal counts keep
# the relative order in which d.items() yields them.
ls = sorted(d.items(), key=lambda x: x[1], reverse=True)

# The context manager closes out2.txt even if a write raises.
with open("out2.txt", "w") as fi:
    for word, count in ls:
        # "+" only joins strings, so the integer count is converted first.
        fi.write(word + ":" + str(count) + "\n")