import pandas as pd
"""
Reference notes for ``pd.concat``:

pd.concat(objs, axis=0, join='outer',
          ignore_index=False, keys=None,
          levels=None, names=None, sort=False,
          verify_integrity=False, copy=True)

objs: the objects to concatenate, e.g. [df1, df2]
axis: 0 (default) appends rows below; 1 appends columns to the right
join: how the other axis is combined: 'outer' = union, 'inner' = intersection
ignore_index: False (default) keeps the original index labels;
              True discards them and renumbers the result 0..n-1
keys: labels, one per object, that become the outermost level of a
      hierarchical index on the concatenation axis
names: names for the levels of the resulting hierarchical index
sort: whether to sort the non-concatenation axis
verify_integrity: check the concatenated axis for duplicate index labels
                  and raise an error if any are found
copy: whether to copy the data; if False, data is not copied unnecessarily
"""
# Row-wise concatenation (axis=0) of two frames with identical columns.
df1 = pd.DataFrame({'x': [1, 2], 'y': [1, 2]})
df2 = pd.DataFrame({'x': [2, 3], 'y': [3, 2]})

# Default ignore_index=False: each frame keeps its own index labels,
# so the labels 0 and 1 appear twice in the result.
print(pd.concat([df1, df2]))
# Output:
#    x  y
# 0  1  1
# 1  2  2
# 0  2  3
# 1  3  2

# ignore_index=True: the original labels are dropped and the rows are
# renumbered 0..3.
print(pd.concat([df1, df2], ignore_index=True))
# Output:
#    x  y
# 0  1  1
# 1  2  2
# 2  2  3
# 3  3  2
# Column-wise concatenation (axis=1) of frames with different row counts.
df3 = pd.DataFrame({'x': [1, 2], 'y': [1, 2], 'key1': [1, 2]})
df4 = pd.DataFrame({'x': [2, 3, 4], 'y': [3, 2, 4], 'key2': [1, 2, 3]})

# join='inner' keeps only the row labels present in both frames (0 and 1);
# keys=[...] adds an outer column level naming the frame each column came from.
print(pd.concat([df3, df4], axis=1, join='inner', keys=['key1', 'key2']))
# Output:
#   key1         key2
#      x  y key1    x  y key2
# 0    1  1    1    2  3    1
# 1    2  2    2    3  2    2
# Same inputs as the inner-join example, redefined so this example runs on
# its own.
df3 = pd.DataFrame({'x': [1, 2], 'y': [1, 2], 'key1': [1, 2]})
df4 = pd.DataFrame({'x': [2, 3, 4], 'y': [3, 2, 4], 'key2': [1, 2, 3]})

# join='outer' keeps every row label from either frame. df3 has no row 2,
# so its columns are filled with NaN there and shown as floats.
print(pd.concat([df3, df4], axis=1, join='outer', keys=['key1', 'key2']))
# Output:
#   key1           key2
#      x    y key1    x  y key2
# 0  1.0  1.0  1.0    2  3    1
# 1  2.0  2.0  2.0    3  2    2
# 2  NaN  NaN  NaN    4  4    3