# -*- coding: utf-8 -*-
"""
Created on Fri Jun 21 11:08:34 2019
@author: User
"""
# 《Python数据分析基础》中国统计出版社
import numpy as np
from scipy import stats
import pandas as pd
import statsmodels.api as sm
# Load the magazine readership data (GBK-encoded CSV) and preview the first rows.
magzine = pd.read_csv(u'data\\ch6\\magzine.csv', encoding="gbk")
print(magzine.head())

# Attach human-readable labels to the coded columns.
# rename_categories() maps the new labels positionally onto the existing
# (sorted) categories and returns a new Series, which is assigned back.
# Direct assignment to `.cat.categories` is not supported by current pandas,
# and assigning to `.cat.set_categories` only overwrites the method on a
# temporary accessor without relabelling anything.
# NOTE(review): assumes each column holds exactly two distinct codes whose
# sorted order corresponds to the label order given here - confirm against
# the data file.
magzine['name'] = (
    magzine['name'].astype('category')
    .cat.rename_categories(['Fashion', 'Cosmetic'])
)
magzine['gender'] = (
    magzine['gender'].astype('category')
    .cat.rename_categories(['Male', 'Female'])
)
# Number of female readers per magazine.
print("\n 先统计一下两种杂志的女性读者人数")
female = magzine.loc[magzine['gender'] == 'Female', 'name'].value_counts()
print(female)

# Total number of readers per magazine.
print("\n 两种杂志的总人数")
magzines = magzine['name'].value_counts()
print(magzines)

# value_counts() sorts each result by descending count independently, so the
# magazine order of `female` may differ from that of `magzines`. Align the
# success counts to the totals' index so each count is paired with the sample
# size of the same magazine before the arrays are handed to the test.
female_aligned = female.reindex(magzines.index, fill_value=0)

# Two-sample z-test for proportions.
# Argument 1: number of successes (female readers) per magazine.
# Argument 2: sample size (all readers) per magazine.
# `value` is the hypothesised difference between the two proportions under
# the null hypothesis; alternative='smaller' makes the test one-sided.
# NOTE(review): the direction of the difference follows the order of
# `magzines.index` (largest readership first) - confirm this is intended.
print(sm.stats.proportions_ztest(np.array(female_aligned),
                                 np.array(magzines),
                                 value=0.3,
                                 alternative='smaller',
                                 prop_var=False))