import pandas as pd
import numpy as np
# Descriptive statistics walkthrough for the meal order detail table.
# Loads the workbook once, then prints a series of summary statistics for the
# 'amounts' column and frequency information for the 'dishes_name' column.

# Load the data.
detail = pd.read_excel('./meal_order_detail.xlsx')

# Work with a single handle on the column instead of re-selecting it for
# every statistic. NOTE(review): 'amounts' is presumably numeric -- confirm
# against the workbook.
amounts = detail['amounts']

# Maximum
print(amounts.max())
# Minimum
print(amounts.min())
# Mean
print(amounts.mean())
# Median
print(amounts.median())
# Standard deviation
print(amounts.std())
# Variance
print(amounts.var())
# Index label of the minimum value
print(amounts.idxmin())
# Index label of the maximum value
print(amounts.idxmax())
# Mode (mode() returns a Series; take its first entry)
print(amounts.mode()[0])
# Number of non-null entries
print(amounts.count())
# Quantiles at 0, 0.25, 0.5, 0.75 and 1.0
q = np.arange(0, 1.25, 0.25)
print(amounts.quantile(q=q))

# describe() bundles several statistics into one result.
print(amounts.describe())
print(detail['dishes_name'].describe())

# Convert 'amounts' to a categorical column so describe() reports
# 'top' / 'freq'. The column is replaced via detail['amounts'] = ... rather
# than detail.loc[:, 'amounts'] = ...: on pandas >= 2.0 the .loc form tries to
# write the values in place, which can leave the original dtype untouched and
# make the ['top', 'freq'] lookup below fail with a KeyError.
detail['amounts'] = amounts.astype('category')
print(detail['amounts'].describe()[['top', 'freq']])

# Count how many times each distinct value occurs in a column.
# Series.value_counts() replaces the deprecated top-level pd.value_counts().
print(detail['dishes_name'].value_counts())
# With pandas, statistical analysis really could not be simpler.
# (Source page footer: latest recommended article published 2024-04-14 05:01:23.)