# 相关函数 (related pandas functions for handling missing values):
# df.dropna()
# df.fillna()
# df.isnull()
# df.isna()
import pandas as pd
import numpy as np
# Demo of pandas missing-value handling: build a small frame containing NaN,
# fill some columns, then count the remaining missing values per row/column.

# Two sample series with missing values; ts2 is reused for both Y and Z.
ts1 = [0, 1, np.nan, np.nan, np.nan, np.nan]
ts2 = [0, 2, np.nan, 3, np.nan, np.nan]
d = {
    'X': ts1,
    'Y': ts2,
    'Z': ts2,
}
df = pd.DataFrame(data=d)
print(df)

# Forward fill: propagate the last valid value downward in columns X and Y.
# Column Z is not selected, so it keeps its NaN entries.
df[['X', 'Y']] = df[['X', 'Y']].ffill()
print(df)

# Fill a specific column with a statistic of that column (median, then mean,
# shown as two alternatives). X has no NaN left after the forward fill above,
# so both calls leave it unchanged for this sample data.
df['X'] = df['X'].fillna(df['X'].median())
df['X'] = df['X'].fillna(df['X'].mean())
print(df)
# head() defaults to the first 5 rows, so these two calls print the same thing.
print(df.head())
print(df.head(5))

# Count the missing values in each row of df (row-wise NaN count).
print("##################################")
rows_null = df.isnull().sum(axis=1)
print(rows_null)

# Count the missing values in each column of df (column-wise NaN count).
print("##################################")
col_null = df.isnull().sum(axis=0)
print(col_null)