# Walk a directory tree, print how many times each file name occurs, and write the counts sorted by frequency.
import os
import string
import sys
from collections import Counter
from operator import itemgetter
def _count_file_names(pathname):
    """Return a Counter of base file names found anywhere under *pathname*."""
    counts = Counter()
    for _root, _dirs, files in os.walk(pathname):
        # Only the base name is counted, so files with the same name in
        # different directories are treated as duplicates of each other.
        counts.update(files)
    return counts


def stat(pathname, outfile="stat.txt"):
    """Count duplicate file names under *pathname* and report them.

    Every file name found while walking *pathname* recursively is counted
    by its base name (directory part ignored).  Each ``name count`` pair is
    printed to standard output, and the same pairs are then written to
    *outfile*, one per line, ordered from the most to the least frequent
    name.

    Args:
        pathname: Root directory to walk.  ``os.walk`` is called without an
            error handler, so an unreadable or missing directory simply
            contributes no files.
        outfile: Path of the report file to (over)write.  Defaults to
            ``"stat.txt"`` in the current working directory.

    Returns:
        None.
    """
    counts = _count_file_names(pathname)

    for name, count in counts.items():
        print("%s %d" % (name, count))

    # most_common() sorts by count in descending order.
    ranked = counts.most_common()

    # The context manager closes the file even if a write fails.
    with open(outfile, "w") as report:
        report.writelines("%s %d\n" % (name, count) for name, count in ranked)
if __name__ == "__main__":
    # The directory to scan is a required argument; report its absence
    # with a usage message instead of an IndexError traceback.
    if len(sys.argv) < 2:
        sys.exit("usage: %s <directory>" % sys.argv[0])
    stat(sys.argv[1])