用 Python 删除文件夹下的重复文件和无法打开的图片

前天不小心把硬盘格式化了,丢了好多照片。后来用 Recuva 这款软件成功把文件恢复了过来,可是恢复出来的文件中有很多重复文件和无法打开的图片,所以写了两个 Python 小程序来解决这个问题。


删除相同文件:

#coding=utf-8

import os
import os.path
import Image
import hashlib

def get_md5(filename, chunk_size=1024 * 1024):
    """Return the hexadecimal MD5 digest of a file's contents.

    The file is opened in binary mode and hashed in fixed-size chunks so
    that large files are never loaded into memory all at once.

    Args:
        filename: Path of the file to hash.
        chunk_size: Number of bytes to read per iteration.

    Returns:
        The MD5 digest as a hexadecimal string.

    Raises:
        IOError / OSError: If the file cannot be opened or read.
    """
    m = hashlib.md5()
    # The with-block closes the file even when a read fails part-way.
    with open(filename, "rb") as mfile:
        # iter() with a sentinel stops at the empty read that marks EOF.
        for chunk in iter(lambda: mfile.read(chunk_size), b""):
            m.update(chunk)
    return m.hexdigest()

if __name__ == '__main__':
    # Root folder to deduplicate; point this at the folder of recovered files.
    ipath = "E:\\20161019_photo"
    # A Python 2 byte string is decoded so os.walk yields unicode names
    # (needed for non-ASCII file names); a text string is used as is.
    uipath = ipath.decode("utf8") if isinstance(ipath, bytes) else ipath

    for parent, dirnames, filenames in os.walk(uipath):
        # Digests seen so far in this directory only: duplicates are detected
        # within one folder, never across different folders.
        seen_md5 = set()
        for filename in filenames:
            full_path = os.path.join(parent, filename)
            # Hash each file exactly once; the digest serves both the
            # membership test and the bookkeeping below.
            digest = get_md5(full_path)
            if digest in seen_md5:
                # Same content as an earlier file in this folder: delete it.
                os.remove(full_path)
            else:
                seen_md5.add(digest)



删除无法打开的图片(注意:该脚本会直接删除所有 .png、.tif、.gif 文件,只对 .jpg 文件检查能否打开):

#coding=utf-8

import os
import os.path
import Image
import hashlib

def get_md5(filename, chunk_size=1024 * 1024):
    """Return the hexadecimal MD5 digest of a file's contents.

    The file is opened in binary mode and hashed in fixed-size chunks so
    that large files are never loaded into memory all at once.

    Args:
        filename: Path of the file to hash.
        chunk_size: Number of bytes to read per iteration.

    Returns:
        The MD5 digest as a hexadecimal string.

    Raises:
        IOError / OSError: If the file cannot be opened or read.
    """
    m = hashlib.md5()
    # The with-block closes the file even when a read fails part-way.
    with open(filename, "rb") as mfile:
        # iter() with a sentinel stops at the empty read that marks EOF.
        for chunk in iter(lambda: mfile.read(chunk_size), b""):
            m.update(chunk)
    return m.hexdigest()

if __name__ == '__main__':
    # Root folder to clean up; point this at the folder of recovered files.
    ipath = "E:\\20161019_photo"
    # A Python 2 byte string is decoded so os.walk yields unicode names
    # (needed for non-ASCII file names); a text string is used as is.
    uipath = ipath.decode("utf8") if isinstance(ipath, bytes) else ipath
    for parent, dirnames, filenames in os.walk(uipath):
        for filename in filenames:
            full_path = os.path.join(parent, filename)
            # Extension comparison is case-sensitive: ".JPG" etc. are skipped.
            ext = os.path.splitext(filename)[1]
            if ext in (".png", ".tif", ".gif"):
                # These formats are deleted unconditionally, without any
                # attempt to open them.
                os.remove(full_path)
            elif ext == ".jpg":
                try:
                    # The with-block closes the handle on success and on
                    # failure, so the file is never still open when removed.
                    with open(full_path, 'rb') as fp:
                        # NOTE(review): Image.open may only parse the header
                        # rather than decode the full image -- confirm whether
                        # a stricter check is wanted.
                        Image.open(fp)
                except Exception:
                    # Any failure to open counts as "cannot be opened".
                    # Exception (not a bare except) keeps Ctrl-C from
                    # deleting the file being checked.
                    os.remove(full_path)




评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值