分类数据可视化 - 统计图
barplot() / countplot() / pointplot()
1. barplot()
#柱状图 - 置信区间估计
#置信区间:样本均值 ± 抽样误差
示例1:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
# Example 1: grouped bar plot of Titanic survival by sex, split by class.
sns.set_context('paper')

# Load the example dataset and preview its first rows.
titanic = sns.load_dataset('titanic')
print(titanic.head())

# Error-bar options, grouped so they read as one unit.
_error_bar_options = {
    'ci': 'sd',           # error size: a value in 0-100, 'sd', or None
    'capsize': 0.05,      # horizontal width of the error-bar caps
    'errcolor': 'gray',   # error-bar line color
    'errwidth': 2,        # error-bar line width
}

sns.barplot(
    data=titanic,
    x='sex',
    y='survived',
    hue='class',
    order=['male', 'female'],  # categories to draw, in this order
    palette='hls',
    # Color saturation.
    # NOTE(review): seaborn documents this as a proportion of the original
    # saturation; 8 is outside 0-1 -- confirm the intended value.
    saturation=8,
    **_error_bar_options,
)
#计算数据
print(titanic.groupby(['sex', 'class']).mean()['survived