立即学习:https://edu.csdn.net/course/play/26990/361134?utm_source=blogtoedu
2、缺失值的处理
# Missing-value handling examples. `df` is assumed to be a pandas DataFrame
# created earlier (not shown here). Unless a result is assigned back or the
# call uses inplace=True, each expression returns a new object and leaves
# `df` unchanged.
df['age'].fillna(df['age'].mean())  # fill missing ages with the column mean
df.fillna(20)  # fill every missing value with the constant 20
df.isnull().mean()  # fraction of missing values in each column
df.dropna()  # drop every row that contains at least one missing value
df.dropna(how='all', axis=0)  # drop only rows where every value is missing
df.dropna(how='any', subset=['Condition', 'Price'])  # drop rows missing either of these two columns
df.fillna(0)  # fill every missing value with 0
# Fill one column with its own mean. The result is assigned back instead of
# calling fillna(..., inplace=True) on the selected column, because that
# chained in-place form does not reliably update `df` under Copy-on-Write.
df['Mileage'] = df['Mileage'].fillna(df['Mileage'].mean())
df[df['Exte_Color'].isnull()]  # rows whose Exte_Color is missing
# Per-column fill values, applied to `df` itself in place.
df.fillna(value={'Exte_Color': 'Black', 'Mileage': 65465}, inplace=True)
df['Exte_Color'].ffill()  # forward fill: propagate the previous valid value
df['Exte_Color'].bfill()  # backward fill: use the next valid value