#-*- coding: utf-8 -*-
import sys
import jieba
def print_dict(pdict, filename):
    """Write the entries of ``pdict`` to ``filename`` as ``key:value`` lines.

    Entries whose key is the empty string are skipped. The file is written
    as UTF-8 and is closed even if a write fails. A confirmation message is
    printed once the file has been written.

    Args:
        pdict: Mapping whose key/value pairs become one output line each.
        filename: Path of the output file; it is created or truncated.
    """
    # Imported locally so the function does not rely on module-level imports.
    import io

    def _to_text(value):
        # Byte strings are decoded as UTF-8 explicitly; this replaces the
        # process-wide sys.setdefaultencoding("utf-8") call, which changed
        # the default encoding for the whole interpreter as a side effect.
        if isinstance(value, bytes):
            return value.decode("utf-8")
        return u"%s" % (value,)

    with io.open(filename, "w", encoding="utf-8") as fp:
        for k, v in pdict.items():
            key = _to_text(k)
            if key == u"":
                continue
            fp.write(u"%s:%s\n" % (key, _to_text(v)))
    # Parenthesised form prints the same text on Python 2 and Python 3.
    print('write to file over!')
def print_words(text, filename):
    """Count the '/'-separated pieces of ``text`` and write the counts to a file.

    ``text`` is split on '/', the occurrences of each distinct piece are
    tallied, and the resulting mapping is passed to ``print_dict`` to be
    written to ``filename``.

    Args:
        text: String whose pieces are separated by '/'.
        filename: Path of the output file, forwarded to ``print_dict``.
    """
    # Imported locally so the function does not rely on module-level imports.
    from collections import Counter

    # Counter tallies in a single O(n) pass; the previous list-membership
    # test made the count quadratic in the number of pieces.
    out_dict = dict(Counter(text.split('/')))
    print_dict(out_dict, filename)
# 文本分词,并统计分词出现次数,结果输出到文件中
# 最新推荐文章于 2022-02-09 09:00:00 发布