# Load the two input tables from CSV files; the relative paths are resolved
# against the current working directory.
train_data = pd.read_csv('candidate_train.csv')
train_answer = pd.read_csv('train_answer.csv')
train_data:
Index(['0', '1', '2', '3', '4', '5', '6', '7', '8', '9',
...
'3168', '3169', '3170', '3171', '3172', '3173', '3174', '3175', '3176',
'id'],
dtype='object', length=3178)
train_answer:
Index(['id', 'p1', 'p2', 'p3', 'p4', 'p5', 'p6'], dtype='object')
# Append the p1 ~ p6 columns from train_answer to the original features.
# A left join on 'id' keeps every row of train_data; rows whose id has no
# match in train_answer get NaN in the appended columns.
train_data = train_data.merge(train_answer, on='id', how='left')