# -*- coding: utf-8 -*-
"""
Created on Sun Jul 21 14:26:22 2019
《Python数据分析基础》中国统计出版社
@author: User
"""
#import numpy as np
from scipy import stats
import pandas as pd
#import statsmodels.api as sm
#import statsmodels.formula.api as smf
#import matplotlib.pyplot as plt
#from statsmodels.stats.multicomp import pairwise_tukeyhsd
#from statsmodels.graphics.api import interaction_plot
#from matplotlib.font_manager import FontProperties
#myfont=FontProperties(fname='data\msyh.ttc')
# Load the sales-by-district table (file is read with GBK encoding) and
# show its first rows.
sales_district = pd.read_csv('data/ch8/sales_district.csv', encoding='gbk')
print(sales_district.head())

# Pull out the Sales column for each of the two districts being compared.
district_1_sales = sales_district.loc[sales_district['district'] == 1, 'Sales']
district_2_sales = sales_district.loc[sales_district['district'] == 2, 'Sales']

# Wilcoxon rank-sum test: district 1 sales vs. district 2 sales.
aa = stats.ranksums(district_1_sales, district_2_sales)
print(aa)
# Output of running the script:
#    district  Sales
# 0         1  87.17
# 1         1  88.45
# 2         1  93.52
# 3         1  96.17
# 4         1  92.68
# RanksumsResult(statistic=-3.6377197716407874, pvalue=0.0002750624589981112)