import pandas as pd
import numpy as np
注意:默认情况下,merge 做的是内连接('inner' join),结果中的键是两张表键的交集;外连接('outer' join)的结果则是键的并集。
# Left table for the merge example: the 'key' column contains repeated values
# ('a' and 'b' three times each, 'c' once); 'data1' is simply 0..6.
df1 = pd.DataFrame({'key': ['b', 'b', 'a', 'c', 'a', 'a', 'b'], 'data1': range(7)})
# Right table: one row per key. 'd' does not occur in df1 and 'c' does not
# occur here, so neither key has a partner in the other table.
df2 = pd.DataFrame({'key': ['a', 'b', 'd'], 'data2': range(3)})
df1
key data1
0 b 0
1 b 1
2 a 2
3 c 3
4 a 4
5 a 5
6 b 6
df2
key data2
0 a 0
1 b 1
2 d 2
pd.merge(df1,df2,on='key')
key data1 data2
0 b 0 1
1 b 1 1
2 b 6 1
3 a 2 0
4 a 4 0
5 a 5 0
df1=pd.DataFrame({‘l