import numpy as np
import pandas as pd
# ---------------------------------------------------------------------------
# Source tables
# ---------------------------------------------------------------------------
# Two name rosters keyed by subject_id (ids '4' and '5' occur in both) and a
# third table that maps subject_id to test_id.
raw_data_1 = dict(
    subject_id=['1', '2', '3', '4', '5'],
    first_name=['Alex', 'Amy', 'Allen', 'Alice', 'Ayoung'],
    last_name=['Anderson', 'Ackerman', 'Ali', 'Aoni', 'Atiches'],
)
raw_data_2 = dict(
    subject_id=['4', '5', '6', '7', '8'],
    first_name=['Billy', 'Brian', 'Bran', 'Bryce', 'Betty'],
    last_name=['Bonder', 'Black', 'Balwner', 'Brice', 'Btisan'],
)
raw_data_3 = dict(
    subject_id=['1', '2', '3', '4', '5', '7', '8', '9', '10', '11'],
    test_id=[51, 15, 15, 61, 16, 14, 15, 1, 61, 16],
)

# One DataFrame per raw table; the column order follows each dict's key order.
data1, data2, data3 = (
    pd.DataFrame(table, columns=list(table))
    for table in (raw_data_1, raw_data_2, raw_data_3)
)

# ---------------------------------------------------------------------------
# Combining the tables
# ---------------------------------------------------------------------------
# Stack data1 on top of data2 (row-wise). The original row labels are kept,
# so the labels 0-4 appear twice in the result.
all_data = pd.concat([data1, data2], axis='index')

# Place data1 and data2 side by side (column-wise), aligned on the row labels.
all_data_col = pd.concat([data1, data2], axis='columns')

# Attach test_id to the stacked roster: keep only rows whose subject_id is
# present in both all_data and data3.
me = all_data.merge(data3, how='inner', on='subject_id')

# Subjects that are listed in both data1 and data2.
me2 = data1.merge(data2, how='inner', on='subject_id')

# Every subject from either roster; the columns of the roster a subject is
# missing from are left empty (NaN).
me3 = data1.merge(data2, how='outer', on='subject_id')
print(me3)
# Pandas data-analysis exercise 5: merging
# (Source page note: latest recommended article published on 2024-04-27 17:30:34)