DataFrame筛选数据与条件判断
import numpy as np
import pandas as pd
# Load the tips dataset from "tips.csv" into a DataFrame and preview
# its first five rows.
df = pd.read_csv("tips.csv")
df.head(n=5)
'''
total_bill tip sex smoker day time size
0 16.99 1.01 Female No Sun Dinner 2
1 10.34 1.66 Male No Sun Dinner 3
2 21.01 3.50 Male No Sun Dinner 3
3 23.68 3.31 Male No Sun Dinner 2
4 24.59 3.61 Female No Sun Dinner 4
'''
1、筛选数据
'''
select total_bill,tip,smoker,time from tips limit 5;
'''
# Project the DataFrame onto the bill, tip, smoker and time columns,
# then show the first five rows of the result.
df[['total_bill', 'tip', 'smoker', 'time']].head()
'''
total_bill tip smoker time
0 16.99 1.01 No Dinner
1 10.34 1.66 No Dinner
2 21.01 3.50 No Dinner
3 23.68 3.31 No Dinner
4 24.59 3.61 No Dinner
'''
2、按条件筛选数据
'''
select * from tips where time='Dinner' limit 5;
'''
# Keep only the rows whose "time" column equals 'Dinner' (boolean mask),
# then show the first five matching rows.
df[df['time'] == 'Dinner'].head()
'''
total_bill tip sex smoker day time size
0 16.99 1.01 Female No Sun Dinner 2
1 10.34 1.66 Male No Sun Dinner 3
2 21.01 3.50 Male No Sun Dinner 3
3 23.68 3.31 Male No Sun Dinner 2
4 24.59 3.61 F