我这里利用 Python 标准库 collections 模块中的 Counter 类来统计每个元素出现的次数:
def get_user_home(file_read):
    """Return the second comma-separated field of every line in a file.

    Args:
        file_read: Path of the text file to read. Each non-blank line is
            expected to contain at least two comma-separated fields.

    Returns:
        A list holding the second field of each non-blank line, in file
        order. Duplicates are kept so that callers can count occurrences.

    Raises:
        IndexError: If a non-blank line contains no comma.
    """
    list_home = []
    with open(file_read, 'r') as file_object:
        # Iterate the file lazily instead of loading every line up front.
        for line in file_object:
            line = line.strip('\n')
            # A blank line (e.g. a trailing empty line at end of file) has
            # no second field; skip it rather than fail with IndexError.
            if not line.strip():
                continue
            list_home.append(line.split(',')[1])
    return list_home
# Count how many times each value returned by get_user_home() occurs.
d = collections.Counter(get_user_home(file_read))

# Split the distinct values into two groups: those seen exactly twice and
# everything else. Each key of `d` is a distinct value; d[key] is its count.
# NOTE(review): values seen three or more times also land in the "single"
# group because the test is `== 2` — confirm this is intended.
double_homes = [k for k in d if d[k] == 2]
single_homes = [k for k in d if d[k] != 2]

# Append each group to its output file, one value per line. Every file is
# opened at most once (instead of once per value), and only when there is
# something to write, so no empty file is created for an empty group.
for out_path, homes in ((file_double_write, double_homes),
                        (file_single_write, single_homes)):
    if homes:
        with open(out_path, 'a') as file_object:
            file_object.writelines(k + '\n' for k in homes)
实现起来还是很简单的:20 万行数据,瞬间就能得到结果。