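# This script splits a text record into segments at each "=====" separator line; what the boy says is saved in the boy files and what the girl says in the girl files.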
#coding=gbk
def save_file(boy, girl, count):
    """Write one conversation segment to a pair of numbered text files.

    The boy's lines go to ``boy_<count>.txt`` and the girl's lines go to
    ``girl_<count>.txt``, both relative to the current working directory.
    Both files are opened in ``"w"`` mode, so existing files with those
    names are overwritten.  The strings are written as given; no line
    separators are added.

    Args:
        boy: Iterable of strings to write to the boy file.
        girl: Iterable of strings to write to the girl file.
        count: Segment number embedded in both file names.
    """
    file_name_boy = "boy_" + str(count) + ".txt"
    file_name_girl = "girl_" + str(count) + ".txt"
    # ``with`` closes both files even when the second open() or one of the
    # writes raises, which the manual close() calls could not guarantee.
    with open(file_name_boy, "w") as boy_file, \
            open(file_name_girl, "w") as girl_file:
        boy_file.writelines(boy)
        girl_file.writelines(girl)
def split_file(file_name):
    """Split a chat record into per-speaker files, one pair per segment.

    Reads ``file_name`` line by line.  A line that starts with ``======``
    ends the current segment: the lines collected so far are handed to
    ``save_file`` together with the segment number (numbering starts at
    1), and collection restarts for the next segment.  Every other line is
    split at its first ``:`` into a role and the spoken text; text spoken
    by ``xx`` is collected for the boy file and text spoken by ``yy`` for
    the girl file.  Whatever has been collected when the file ends is
    saved as the final segment, even if both lists are empty.

    Lines without a ``:`` and lines spoken by any other role are ignored.

    Args:
        file_name: Path of the record file to read.
    """
    boy = []
    girl = []
    count = 1
    # Open the file that was actually requested (the path used to be
    # hard-coded) and let ``with`` close it even if processing fails.
    with open(file_name) as record:
        for each in record:
            if each.startswith("======"):
                # Separator line: flush the finished segment and start anew.
                save_file(boy, girl, count)
                boy = []
                girl = []
                count += 1
                continue
            # partition() never raises; an empty separator means the line
            # has no ":" (e.g. a blank line), so there is no role to match.
            role, sep, line_spoken = each.partition(":")
            if not sep:
                continue
            if role == "xx":
                boy.append(line_spoken)
            elif role == "yy":
                girl.append(line_spoken)
    # The last segment has no trailing separator, so save it explicitly.
    save_file(boy, girl, count)
# Script entry: split the record file found in the current working directory.
split_file("record.txt")