# Load the data
import pandas as pd
# Absolute Windows path to the white wine CSV file.
fpath = "G:\\萍_python\\data\\white_wine.csv"
data = pd.read_csv(fpath, sep=',')
# Print the first five rows as a quick look at what was loaded.
print(data.head(n=5))
def huanhang():
    """Print two separator rows of '#' characters to stdout.

    Used between outputs to visually break up the printed results
    ("huanhang" is pinyin for "line break").
    """
    for _ in range(2):
        print('#############################################################')
huanhang()

# Collect the distinct quality grades that occur in the white wine data.
quality_class = data['quality'].drop_duplicates()  # keep='first' is the default
display(quality_class)
huanhang()
print(len(quality_class))

# Group the rows by quality grade (7 grades according to the original note)
# and count how many wines fall into each grade.
# The grouping key is passed as a Series so the 'quality' column stays
# available to agg().
grouped_by_quality = data.groupby(by=data['quality'])
display(grouped_by_quality.agg({'quality': 'size'}))

# Mean of 'fixed acidity' within each quality grade.
display(grouped_by_quality.agg({'fixed acidity': 'mean'}))
# IDE: VS Code, Jupyter, Python