import numpy as np
import pandas as pd
# Sample data set: one row per (fruit, color) offer with its price.
df1 = pd.DataFrame(
    {
        'fruit': ['apple', 'banana', 'orange', 'apple', 'banana'],
        'color': ['red', 'yellow', 'yellow', 'cyan', 'cyan'],
        'price': [8.5, 6.8, 5.6, 7.8, 6.4],
    }
)
# Bare expression: shows the frame when run as a notebook cell.
df1
![在这里插入图片描述](https://i-blog.csdnimg.cn/blog_migrate/36d99b70460aa4f397f6c2ec19c09b4a.png)
# Keep only the rows whose fruit is 'apple' (boolean-mask selection).
df2 = df1.loc[df1['fruit'] == 'apple']
# Bare expression: shows the filtered frame when run as a notebook cell.
df2
![在这里插入图片描述](https://i-blog.csdnimg.cn/blog_migrate/4b68cb95a697ad35afe2abe6a03ab690.png)
# Mean of the numeric columns for the 'apple' group only.
# numeric_only=True is required: the group still carries the string columns
# 'fruit' and 'color', and pandas >= 2.0 raises TypeError when asked to
# average them (older versions silently dropped them).
df1.groupby(by='fruit').get_group('apple').mean(numeric_only=True)

# Mean price per fruit; the double brackets keep the result a DataFrame.
df1.groupby(by='fruit')[['price']].mean()

# Mean price per (fruit, color) pair, indexed by both keys.
df1.groupby(by=['fruit', 'color'])[['price']].mean()
![在这里插入图片描述](https://i-blog.csdnimg.cn/blog_migrate/c3529b85005b409c1e888914a409e40b.png)
# Mean price per (fruit, color) pair, then pivot the innermost index level
# (color) into columns so the result reads as a fruit-by-color table.
(
    df1.groupby(['fruit', 'color'])['price']
    .mean()
    .unstack()
)
![在这里插入图片描述](https://i-blog.csdnimg.cn/blog_migrate/1684084753e7497bf4d5e055b079fd61.png)
# Two ways to count how many rows each fruit has.
# 1) Frequency table of the 'fruit' column.
df1['fruit'].value_counts()
# 2) Group by fruit and count the entries of the 'color' column.
(
    df1.groupby('fruit')['color']
    .count()
)
![在这里插入图片描述](https://i-blog.csdnimg.cn/blog_migrate/b1567f9b4658302d4099fc2b8020c634.png)
- 6. 每种水果的差价(最高价减去最低价)
![在这里插入图片描述](https://i-blog.csdnimg.cn/blog_migrate/0250405bdc334377d415173ceaaf739f.png)
def func(a):
    """Return the spread of *a*: its maximum minus its minimum.

    Args:
        a: Any object exposing ``max()`` and ``min()`` methods, such as a
            pandas Series of prices for one group.

    Returns:
        The difference ``a.max() - a.min()``.
    """
    return a.max() - a.min()
# Price spread (max - min) per fruit using the custom reducer `func`,
# shown through three GroupBy entry points: apply, agg, and aggregate.
df1.groupby(by='fruit')['price'].apply(func)
df1.groupby(by='fruit')['price'].agg(func)
df1.groupby(by='fruit')['price'].aggregate(func)
![在这里插入图片描述](https://i-blog.csdnimg.cn/blog_migrate/e5d2190ca2ed731a4b4c3c5c406d927b.png)