1. 重名加后缀区分：重复的 glass_id 第一次出现保持不变，之后依次加 _1、_2 … 后缀
# Make repeated glass_id values unique: the first occurrence keeps its name,
# every later occurrence gets "_<k>" appended (k = 1, 2, ... in row order).
# Assumes glass_id holds strings (the suffix is added by string concatenation).
cols = timesort_data.loc[:, 'glass_id'].copy()
# Position of each row among the rows sharing its value (0 = first occurrence).
# Grouping by the raw array sidesteps index alignment, and dropna=False keeps
# the counter an integer even when the column contains missing values.
occurrence = cols.groupby(cols.to_numpy(), dropna=False).cumcount()
suffixed = cols + '_' + occurrence.astype(str)
# Keep the original value for first occurrences, take the suffixed one otherwise.
cols = cols.where(occurrence == 0, suffixed)
timesort_data.loc[:, 'glass_id'] = cols
2. 获取列 col 中取值相同的行的行号（按取值分组，每组的行号组成一个元组）
# Group the rows of the selected columns by their values and collect, for each
# group, the index labels of its rows as a tuple.
# `col` must select a DataFrame (e.g. a list of column names), because the
# grouping keys are taken from `.columns`.
# NOTE: groups containing a single row are included as 1-tuples; filter on
# len(...) > 1 if only true repeats are wanted.
key_frame = remain_data.loc[:, col]
# Iterating the groups directly avoids GroupBy.apply, whose return type depends
# on what the callback returns and on whether any group exists at all.
repeat_list = [
    tuple(rows.index)
    for _, rows in key_frame.groupby(key_frame.columns.tolist())
]
3. 取出列名包含某个字符串（例如 "_a_"）的所有列
# Keep only the columns whose name contains the literal substring "_a_".
# regex=False matches the text literally instead of as a regular expression;
# na=False makes non-string labels count as "no match" so the mask is boolean.
data = df.loc[:, df.columns.str.contains("_a_", regex=False, na=False)]