#author:Xuliu
#time:2021-07-31
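#function: compute the set difference of two folders (pictures in the large folder that are not in the selected folder)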
#input:10w pictures and selected 6w
#output:the rest 3w pictures
#导入对路径操作的库
import sys
import os
# from IPython import embed
import shutil
# Folder holding the complete set of pictures.
root_path = '/home/xl/workstation/Datasets/annores/new_keyframe'
# Folder holding the pictures that were already selected.
select_picture_path="/home/xl/workstation/Datasets/annores/JPEGImages"
# Destination folder for the remainder: the complete set minus the selected set.
save_picture_path = "/home/xl/workstation/Datasets/annores/MyJPEGImages"


def _jpg_stems(folder):
    """Return the set of base names (extension removed) of the ``.jpg`` files in *folder*."""
    stems = set()
    for name in os.listdir(folder):
        stem, ext = os.path.splitext(name)
        # Only exact, lower-case ".jpg" entries take part in the comparison.
        if ext == '.jpg':
            stems.add(stem)
    return stems


def copy_difference(src_dir, selected_dir, dst_dir):
    """Copy every ``.jpg`` in *src_dir* whose base name is absent from *selected_dir*.

    Files are matched by base name (file name without the ``.jpg`` extension).

    Args:
        src_dir: Folder containing the complete set of pictures.
        selected_dir: Folder containing the already-selected pictures.
        dst_dir: Folder that receives the remaining pictures; it is created
            if it does not exist yet.

    Returns:
        The sorted list of base names that were copied.

    Raises:
        OSError: If a folder cannot be listed or created, or a file cannot
            be copied.
    """
    # Set difference: names present in src_dir but not in selected_dir.
    # Sorting makes the copy order (and the return value) deterministic.
    remaining = sorted(_jpg_stems(src_dir) - _jpg_stems(selected_dir))
    # Without an existing directory, shutil.copy would treat dst_dir as a
    # file name and overwrite that single file with every picture in turn.
    os.makedirs(dst_dir, exist_ok=True)
    for stem in remaining:
        shutil.copy(os.path.join(src_dir, stem + ".jpg"), dst_dir)
    return remaining


if __name__ == "__main__":
    differ_list = copy_difference(root_path, select_picture_path, save_picture_path)
# Python script 004: compute the set difference of two folders
# (Blog page footer: latest recommended article published 2022-04-11 09:53:29)