import numpy as np
import pandas as pd
# Sample data: col1 is complete, col2/col3 are numeric with gaps, and
# col4/col5 hold strings with gaps.
dic = dict(
    col1=[1, 2, 3, 4, 5],
    col2=[1, np.nan, 3, np.nan, 6],
    col3=[1, 2, np.nan, np.nan, 5],
    col4=['aaa', 'bbb', np.nan, 'ccc', 'bbb'],
    col5=['bbb', 'ccc', 'ccc', np.nan, np.nan],
)

# Turn the dictionary into a DataFrame and show it before any filling.
df = pd.DataFrame(data=dic)
print(df)

# Numeric gaps: replace NaN in col2 with the column mean, then show the frame.
col2_mean = df['col2'].mean()
df['col2'] = df['col2'].fillna(value=col2_mean)
print(df)

# Numeric gaps: replace NaN in col3 with the column median, then show the frame.
col3_median = df['col3'].median()
df['col3'] = df['col3'].fillna(value=col3_median)
print(df)

# String gaps: replace NaN with the mode. mode() returns a Series, so [0]
# picks its first entry as the fill value.
for column in ('col4', 'col5'):
    most_frequent = df[column].mode()[0]
    df[column] = df[column].fillna(value=most_frequent)

# Both string columns are filled before either one is printed.
for column in ('col4', 'col5'):
    print(df[column])
# Missing-value handling with fillna
# (Source page note: latest recommended article published 2024-02-13 18:58:15)