# Series demo: when several entries share the same index label (e.g. two
# 'a' entries), replace them with a single entry holding their mean.
a = pd.Series([1, 2, 3, 4, 6, 7], index=['a', 'a', 'b', 'b', 'c', 'd'])
ind = list(a.index)

# Count how often each index label occurs.
ind_dict = {}
for i in ind:
    ind_dict[i] = ind_dict.get(i, 0) + 1
print(ind)  # ['a', 'a', 'b', 'b', 'c', 'd']
print(ind_dict)  # {'a': 2, 'b': 2, 'c': 1, 'd': 1}

# Collect the labels that occur more than once.  Walking the count dict
# keeps them in first-occurrence order; going through set() made the order
# (and therefore the final Series order) vary from run to run.
chongfu_index = [label for label, count in ind_dict.items() if count > 1]
print(chongfu_index)  # ['a', 'b']

# Compute the mean of every duplicated label, then remove all of those
# entries from the original Series (in place).
data = [a[label].mean() for label in chongfu_index]
a.drop(chongfu_index, inplace=True)
print(data)  # the means 1.5 and 3.5

# Build a separate Series that holds one averaged entry per duplicated label.
add_data_Series = pd.Series(data, index=chongfu_index)
print(add_data_Series)  # a 1.5, b 3.5

# Join the remaining unique entries with the averaged ones.  Series.append
# was removed in pandas 2.0, so pd.concat is used instead.
a = pd.concat([a, add_data_Series])
print(a)
# Expected output of the print above:
'''
c 6.0
d 7.0
a 1.5
b 3.5
'''
print('-------------------------')
# print(a['a'].mean())  # mean of all entries that share one index label
# What follows is a hand-written equivalent of print(a['a'].mean()).
a = pd.Series(data=[1, 2, 3, 4, 6, 7], index=list('aabbcd'))
dict_index = dict(a=2, b=2)  # duplicated labels; only the keys are used below
data = []
avg = 0  # NOTE: never read in the visible part of this script
for i in dict_index:
    group_values = a[i].values  # raw array of every entry labelled i
    print(group_values)  # [1 2] for 'a', then [3 4] for 'b'
    data.append(group_values.mean())
print(data)  # the means 1.5 and 3.5
# One averaged entry per duplicated label.
data_series = pd.Series(data, index=list(dict_index))
print(data_series)
'''
a 1.5
b 3.5
dtype: float64
'''