pandas 数据预处理实验:鸢尾花

import pandas as pd
import numpy as np
from sklearn import datasets
import seaborn as sns
# Load the iris dataset that ships with scikit-learn.
iris = datasets.load_iris()
# Show which fields the loaded dataset object exposes.
iris.keys()
dict_keys(['data', 'target', 'target_names', 'DESCR', 'feature_names', 'filename'])
# Wrap the iris data array in a DataFrame, one named column per feature.
X_train = pd.DataFrame(data=iris.data, columns=iris.feature_names)
X_train
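|     | sepal length (cm) | sepal width (cm) | petal length (cm) | petal width (cm) |
|-----|-------------------|------------------|-------------------|------------------|
| 0   | 5.1 | 3.5 | 1.4 | 0.2 |
| 1   | 4.9 | 3.0 | 1.4 | 0.2 |
| 2   | 4.7 | 3.2 | 1.3 | 0.2 |
| 3   | 4.6 | 3.1 | 1.5 | 0.2 |
| 4   | 5.0 | 3.6 | 1.4 | 0.2 |
| ... | ... | ... | ... | ... |
| 145 | 6.7 | 3.0 | 5.2 | 2.3 |
| 146 | 6.3 | 2.5 | 5.0 | 1.9 |
| 147 | 6.5 | 3.0 | 5.2 | 2.0 |
| 148 | 6.2 | 3.4 | 5.4 | 2.3 |
| 149 | 5.9 | 3.0 | 5.1 | 1.8 |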

150 rows × 4 columns

# Summary statistics (count, mean, std, min, quartiles, max) for each feature column.
X_train.describe()
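|       | sepal length (cm) | sepal width (cm) | petal length (cm) | petal width (cm) |
|-------|-------------------|------------------|-------------------|------------------|
| count | 150.000000 | 150.000000 | 150.000000 | 150.000000 |
| mean  | 5.843333 | 3.057333 | 3.758000 | 1.199333 |
| std   | 0.828066 | 0.435866 | 1.765298 | 0.762238 |
| min   | 4.300000 | 2.000000 | 1.000000 | 0.100000 |
| 25%   | 5.100000 | 2.800000 | 1.600000 | 0.300000 |
| 50%   | 5.800000 | 3.000000 | 4.350000 | 1.300000 |
| 75%   | 6.400000 | 3.300000 | 5.100000 | 1.800000 |
| max   | 7.900000 | 4.400000 | 6.900000 | 2.500000 |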
# Mean of each feature column.
X_train.mean()
sepal length (cm)    5.843333
sepal width (cm)     3.057333
petal length (cm)    3.758000
petal width (cm)     1.199333
dtype: float64
# Pairwise correlation matrix between the feature columns.
X_train.corr()
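|                   | sepal length (cm) | sepal width (cm) | petal length (cm) | petal width (cm) |
|-------------------|-------------------|------------------|-------------------|------------------|
| sepal length (cm) | 1.000000 | -0.117570 | 0.871754 | 0.817941 |
| sepal width (cm)  | -0.117570 | 1.000000 | -0.428440 | -0.366126 |
| petal length (cm) | 0.871754 | -0.428440 | 1.000000 | 0.962865 |
| petal width (cm)  | 0.817941 | -0.366126 | 0.962865 | 1.000000 |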
# Draw the feature correlation matrix as a heatmap with the values printed in each cell.
sns.heatmap(data=X_train.corr(), cmap='RdYlBu', annot=True)
<matplotlib.axes._subplots.AxesSubplot at 0x1f90f0c96c8>

![output_7_1](output_7_1.png)

# One boolean indicator frame per class label (0, 1, 2): True where the
# sample's target equals that label.
Y_train0, Y_train1, Y_train2 = (
    pd.DataFrame(iris.target).eq(label) for label in (0, 1, 2)
)
# Place the three indicator columns side by side and label them with the
# dataset's class names.
Y_train = pd.concat([Y_train0, Y_train1, Y_train2], axis=1)
Y_train.columns = iris.target_names
Y_train
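|     | setosa | versicolor | virginica |
|-----|--------|------------|-----------|
| 0   | True | False | False |
| 1   | True | False | False |
| 2   | True | False | False |
| 3   | True | False | False |
| 4   | True | False | False |
| ... | ... | ... | ... |
| 145 | False | False | True |
| 146 | False | False | True |
| 147 | False | False | True |
| 148 | False | False | True |
| 149 | False | False | True |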

150 rows × 3 columns

# Combine the feature columns and the class-indicator columns into one table.
Train = pd.concat(objs=[X_train, Y_train], axis="columns")
Train
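|     | sepal length (cm) | sepal width (cm) | petal length (cm) | petal width (cm) | setosa | versicolor | virginica |
|-----|-------------------|------------------|-------------------|------------------|--------|------------|-----------|
| 0   | 5.1 | 3.5 | 1.4 | 0.2 | True | False | False |
| 1   | 4.9 | 3.0 | 1.4 | 0.2 | True | False | False |
| 2   | 4.7 | 3.2 | 1.3 | 0.2 | True | False | False |
| 3   | 4.6 | 3.1 | 1.5 | 0.2 | True | False | False |
| 4   | 5.0 | 3.6 | 1.4 | 0.2 | True | False | False |
| ... | ... | ... | ... | ... | ... | ... | ... |
| 145 | 6.7 | 3.0 | 5.2 | 2.3 | False | False | True |
| 146 | 6.3 | 2.5 | 5.0 | 1.9 | False | False | True |
| 147 | 6.5 | 3.0 | 5.2 | 2.0 | False | False | True |
| 148 | 6.2 | 3.4 | 5.4 | 2.3 | False | False | True |
| 149 | 5.9 | 3.0 | 5.1 | 1.8 | False | False | True |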

150 rows × 7 columns

# Heatmap of the correlations across both the feature columns and the
# class-indicator columns, with the values printed in each cell.
sns.heatmap(data=Train.corr(), cmap='RdYlBu', annot=True)
<matplotlib.axes._subplots.AxesSubplot at 0x1f90f027a48>

![output_10_1](output_10_1.png)

在这里插入图片描述
在这里插入图片描述

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包

打赏作者

泰洋睿兔

你的鼓励将是我创作的最大动力

¥1 ¥2 ¥4 ¥6 ¥10 ¥20
扫码支付:¥1
获取中
扫码支付

您的余额不足,请更换扫码支付或充值

打赏作者

实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值