这周的学习内容是参数估计实践,主要是使用 Python 对我们上周学习的理论知识进行实践。
正态分布下的置信区间
def norm_conf(data, confidence=0.95):
    """Print and return a normal-distribution interval centred on the mean of ``data``.

    The interval is ``scipy.stats.norm.interval`` evaluated with ``loc`` set to
    the sample mean and ``scale`` set to the sample standard deviation
    (computed with ``ddof=1``).

    NOTE(review): ``scale`` is the standard deviation of ``data`` itself, not
    ``std / sqrt(n)``. It equals the standard error of the mean only when
    ``data`` already holds sample means -- confirm that callers pass means
    rather than raw observations.

    Args:
        data: Sequence or array of numeric values.
        confidence: Probability mass the interval should contain.

    Returns:
        The ``(lower, upper)`` bounds produced by scipy.
    """
    # https://docs.scipy.org/doc/scipy/reference/generated/scipy.stats.norm.html
    sample_mean = np.mean(data)
    sample_std = np.std(data, ddof=1)
    # The level is passed positionally because scipy renamed this keyword
    # (``alpha`` -> ``confidence``) between releases.
    conf_interval = scipy.stats.norm.interval(
        confidence, loc=sample_mean, scale=sample_std
    )
    print(conf_interval)
    return conf_interval
T分布下的置信区间
```python
def ttest_conf(data, confidence=0.95):
    """Print and return a Student's t interval centred on the mean of ``data``.

    The interval is ``scipy.stats.t.interval`` evaluated with
    ``len(data) - 1`` degrees of freedom, ``loc`` set to the sample mean and
    ``scale`` set to the sample standard deviation (computed with ``ddof=1``).

    NOTE(review): ``scale`` is the standard deviation of ``data`` itself, not
    ``std / sqrt(n)``. It equals the standard error of the mean only when
    ``data`` already holds sample means -- confirm that callers pass means
    rather than raw observations.

    Args:
        data: Sequence or array of numeric values.
        confidence: Probability mass the interval should contain.

    Returns:
        The ``(lower, upper)`` bounds produced by scipy.
    """
    sample_mean = np.mean(data)
    sample_std = np.std(data, ddof=1)
    sample_size = len(data)
    # The level is passed positionally because scipy renamed this keyword
    # (``alpha`` -> ``confidence``) between releases.
    conf_interval = scipy.stats.t.interval(
        confidence, df=sample_size - 1, loc=sample_mean, scale=sample_std
    )
    print(conf_interval)
    return conf_interval
# Print the t-distribution interval for the resampled means. `scale_means` is
# only assigned further down in this file, so that resampling code must have
# run before this call.
ttest_conf(scale_means)
```
重复抽取数据
# Repeated resampling: draw 1000 samples of 100 items each from `age`, with
# replacement, and record the mean of every sample.
# NOTE(review): `age` is defined outside this excerpt; presumably a pandas
# Series, since `.sample(n, replace=True)` and `.mean()` are called on it.
scale_means = []
for _ in range(1000):
    scale_sample = age.sample(100, replace=True)
    mean = scale_sample.mean()
    scale_means.append(mean)

# Print the normal-distribution interval computed from the resampled means.
norm_conf(scale_means)
绘制数据
import seaborn as sns
from matplotlib import pyplot as plt
# Plot the distribution of the resampled means (`scale_means`) as a 10-bin
# histogram with a KDE curve.
sns.set_palette("hls") # set the colour palette for all plots, using the hls colour space
# NOTE(review): `distplot` is deprecated since seaborn 0.11 in favour of
# `histplot`/`displot` -- confirm the installed seaborn version still has it.
sns.distplot(scale_means,color="r",bins=10,kde=True)
plt.title('Age')
# Restrict the x-axis to the range 25-35.
plt.xlim(25,35)
plt.grid(True)
plt.show()