import pandas as pd
# Load the student sheet and print every row whose 'Name' repeats an earlier row.
students = pd.read_excel('D:/Code/.vscode/Students_Duplicates.xlsx')
# duplicated() flags the second and later occurrences of each Name as True.
# To compare several columns at once, pass a list as subset, e.g. ['ID', 'Name'].
dupe = students.duplicated(subset='Name')
# Keep only the flagged entries; a boolean Series can filter itself directly.
dupe = dupe[dupe]
# dupe.index holds row labels, so select with label-based .loc rather than the
# positional .iloc (the two only coincide for a default 0..n-1 index).
print(students.loc[dupe.index])  # find and print the duplicate rows
# To remove the duplicates instead, keeping the first occurrence of each Name:
# students.drop_duplicates(subset='Name', inplace=True, keep='first')
# print(students)
import pandas as pd
# De-duplicate the CHART workbook on the 'sku' column (first occurrence is
# kept), save the result to OUTPUT.xlsx, and print the whole table.

# Lift pandas' display limits so print() shows every row and column.
pd.set_option('display.max_rows', None)
pd.set_option('display.max_columns', None)

chart = pd.read_excel('D:/code/code practice/CHART.xlsx')
data = chart.drop_duplicates(subset='sku', keep='first')

data.to_excel('D:/code/code practice/OUTPUT.xlsx')
print(data)
# To print all rows and columns, including the ones pandas hides by default,
# just add these two lines of code:
# pd.set_option('display.max_columns', None)
# pd.set_option('display.max_rows', None)