import seaborn as sns

# Step 1: load the Titanic dataset and select its "age" column.
titanic = sns.load_dataset("titanic")
age = titanic["age"]
# 2、然后求取平均值（四舍五入取整），将为空的数据设置为该平均值
# Round the mean age to a whole number before using it as the fill value.
mean = age.mean()
mean = mean.round()
# Reassign rather than calling fillna(..., inplace=True): `age` is a column
# taken from a DataFrame, and whether an in-place fill also modifies that
# DataFrame depends on the pandas version and its copy-on-write mode.
age = age.fillna(mean)
# 3、去掉高位异常值（大于“平均值 + 3 倍标准差”的数据）
# Upper cutoff: three standard deviations above the mean.
max_value = age.mean() + 3 * age.std()
# Keep only the values at or below the cutoff; low values are not filtered.
age = age[age <= max_value]
# 4、归一化数据
# Min-max scaling: the smallest age maps to 0 and the largest to 1.
age_normalized = (age - age.min()) / (age.max() - age.min())
print(age_normalized.head(10))
# 5、标准化数据
# Z-score scaling: subtract the mean, then divide by the standard deviation.
age_standardized = (age - age.mean()) / age.std()
print(age_standardized.head(10))