一、功能介绍
输入:
某样本数据
样本分组数
输出:
必选:直方图(纵轴为落入各分组的样本数目)
可选:累计频率曲线(绘制在右侧第二纵轴上,取值范围为 0~1)
二、代码
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
class Histplot:
    """Histogram of one sample with an optional cumulative-frequency curve.

    The histogram (sample count per bin) is drawn on the left y-axis. When
    enabled, the cumulative relative frequency is drawn on a twin right
    y-axis whose range is fixed to [0, 1].
    """

    def __init__(self, x_data, num_bins, linetype='ro-', legends=None, xlabel=None, ylabels=None, fsize=(10, 10), df_line=1):
        """
        :param x_data: sample values to bin
        :param num_bins: number of bins for the histogram
        :param linetype: matplotlib format string of the cumulative-frequency
            curve; the default ``'ro-'`` is a red solid line with circle markers
        :param legends: two legend labels ``[histogram, curve]``;
            defaults to ``["计数", "累计频率"]``
        :param xlabel: x-axis title; defaults to ``"数据x"``
        :param ylabels: titles of the two y-axes ``[left, right]``;
            defaults to ``["计数", "累计频率"]``
        :param fsize: figure size ``(width, height)`` handed to
            ``plt.subplots(figsize=...)``; it also scales the font size
            (from the height) and the marker size (from the width)
        :param df_line: truthy to draw the cumulative-frequency curve
        """
        if legends is None:
            legends = ["计数", "累计频率"]
        if xlabel is None:
            xlabel = "数据x"
        if ylabels is None:
            ylabels = ["计数", "累计频率"]
        self.x_data = x_data
        self.num_bins = num_bins
        self.linetype = linetype
        self.fsize = fsize
        self.legends = legends
        self.xlabel = xlabel
        self.ylabels = ylabels
        self.df_line = df_line

    def change_legend(self, new_legends):
        """Replace the legend labels with ``new_legends``."""
        self.legends = new_legends

    def change_ylabel(self, new_labels):
        """Replace the titles of the two y-axes with ``new_labels``."""
        self.ylabels = new_labels

    def change_xlabel(self, new_label):
        """Replace the x-axis title with ``new_label``."""
        self.xlabel = new_label

    def change_linetype(self, new_linetype):
        """Replace the format string of the cumulative-frequency curve."""
        self.linetype = new_linetype

    @staticmethod
    def _cumulative_frequency(counts):
        """Return the cumulative relative frequency at every bin edge.

        :param counts: per-bin sample counts (length ``k``)
        :return: numpy array of length ``k + 1``; element ``i`` is the share
            of counted samples lying in the first ``i`` bins, so the first
            value is 0.0 and, for a non-empty sample, the last is 1.0.
            All zeros when nothing was counted.
        """
        counts = np.asarray(counts, dtype=float)
        running = np.concatenate(([0.0], np.cumsum(counts)))
        total = counts.sum()
        if total == 0:
            # Empty sample: avoid dividing by zero, the curve stays flat at 0.
            return running
        return running / total

    def draw_plot(self):
        """Draw the histogram (and the optional curve) and show the figure."""
        fs = self.fsize  # canvas size (width, height)

        # Let seaborn set a uniform font size: 0.12 * height, i.e. a height
        # of 10 gives font_scale = 1.2.
        sns.set_style("ticks")
        sns.set_context("talk", font_scale=fs[1] * 0.12)
        # Must come after set_style, which resets the font list.
        plt.rcParams['font.sans-serif'] = ['SimHei']
        # CJK fonts such as SimHei lack the Unicode minus glyph; fall back to
        # the ASCII hyphen so negative tick labels do not render as boxes.
        plt.rcParams['axes.unicode_minus'] = False

        fig, ax = plt.subplots(figsize=fs)

        # Left axis: the histogram itself (always drawn).
        counts, bin_edges, _ = ax.hist(self.x_data, self.num_bins, rwidth=0.9, label=self.legends[0])
        ax.set_xlabel(self.xlabel)
        ax.set_ylabel(self.ylabels[0])

        # Right axis: cumulative-frequency curve (optional), one point per
        # bin edge.
        if self.df_line:
            cum_freq = self._cumulative_frequency(counts)
            ax2 = ax.twinx()
            ax2.plot(bin_edges, cum_freq, self.linetype, ms=fs[0] * 0.5, markeredgecolor='k', label=self.legends[1])
            ax2.set_ylim(0, 1)
            ax2.set_ylabel(self.ylabels[1])

        # A figure-level legend gathers the labelled artists of both axes;
        # anchor it to the upper-right corner of the plotting area.
        fig.legend(loc=1, bbox_to_anchor=(1, 1), bbox_transform=ax.transAxes)
        fig.tight_layout()
        plt.show()
if __name__ == "__main__":
    # Demo: histogram of 500 normally distributed values (mean 100, std 15)
    # with the cumulative-frequency curve enabled by default.
    np.random.seed(19680801)  # fixed seed so the demo figure is reproducible
    iqs = 100 + 15 * np.random.randn(500)  # sample data to plot
    bins = 50  # number of histogram bins
    plot1 = Histplot(iqs, num_bins=bins, fsize=(10, 6.18))
    plot1.draw_plot()