import numpy as np
import matplotlib.pyplot as plt;
2.加载数据
# Load the CSV into a DataFrame. A forward slash is used so the relative path
# resolves on every OS (a backslash is only a path separator on Windows, and
# "\w" is an invalid string escape).
dataSet = pd.read_csv("data/winequality-red.csv")
# print(dataSet.head())
pd.set_option('display.max_columns', None)  # show every DataFrame column when printing
# print("describe", dataSet.describe())
print("shape", np.shape(dataSet))
输出
![在这里插入图片描述](https://img-blog.csdnimg.cn/20200518222221350.png?x-oss-process=image/watermark,type_ZmFuZ3poZW5naGVpdGk,shadow_10,text_aHR0cHM6Ly9ibG9nLmNzZG4ubmV0L3dlaXhpbl80NDIzNTEwOQ==,size_16,color_FFFFFF,t_70)
3.数据分析
dataSet.hist()  # histograms of the DataFrame's columns
plt.show()
# Display the correlations between variables as an annotated heatmap.
sns.heatmap(
    dataSet.astype(float).corr(),
    linewidths=0.1,
    vmax=1.0,
    square=True,
    linecolor='white',
    annot=True,
)
plt.show()
输出
![在这里插入图片描述](https://img-blog.csdnimg.cn/20200518222417475.png?x-oss-process=image/watermark,type_ZmFuZ3poZW5naGVpdGk,sh