# -*- coding:utf-8 -*-
"""Compare two CSV exports and write the rows missing from the first to a third file.

Both inputs must contain an ``order_no`` column.  Every row of the second
("more") file whose ``order_no`` does not occur in the first ("low") file is
appended, without a header row, to ``diff_record_<unix-timestamp>``.
"""
import time

import pandas as pd

# Input files and the column the comparison is keyed on.
LOW_CSV = "id_check_total_india_1594870405.csv"
MORE_CSV = "Aadhaar卡简版测试样本.csv"
KEY_COLUMN = "order_no"


def find_missing_rows(df_low, df_more, key=KEY_COLUMN):
    """Return the rows of *df_more* whose *key* value is absent from *df_low*.

    Args:
        df_low: DataFrame holding the smaller/reference set of records.
        df_more: DataFrame holding the larger set of records.
        key: Name of the column identifying a record in both frames.

    Returns:
        A DataFrame with the same columns as *df_more*, containing the
        unmatched rows in their original order (duplicates are kept).

    Raises:
        KeyError: If *key* is not a column of both frames.
    """
    # Compare on the key column only: testing the id against every cell of a
    # row would also match rows where an unrelated column happens to hold
    # the same value.
    is_new = ~df_more[key].isin(df_low[key])
    # Rows with no key at all cannot be identified, so they are not reported.
    has_key = df_more[key].notna()
    return df_more[is_new & has_key]


def main():
    """Read both CSV files and write the unmatched rows to the diff file."""
    df_low = pd.read_csv(LOW_CSV)
    df_more = pd.read_csv(MORE_CSV)

    missing = find_missing_rows(df_low, df_more)
    if missing.empty:
        # Nothing differs: do not create an empty output file.
        return

    file_name = f"diff_record_{int(time.time())}"
    # to_csv handles quoting of embedded commas/newlines, which a manual
    # ",".join() does not; the file is opened once instead of once per row.
    missing.to_csv(
        file_name,
        mode="a",
        index=False,
        header=False,
        encoding="utf-8",
    )


if __name__ == "__main__":
    main()
python & pandas 比较两个文件并把不同写入第三个文件
最新推荐文章于 2023-03-31 13:49:23 发布