import os

import pandas as pd
def _demo_reading(a):
    """Print examples of reading headers, columns, rows and cells of ``a``."""
    # Reading headers.
    print(a.columns)
    # Read a specific column (first three values).
    print(a['T'][:3])
    # NOTE: ``a.T`` is the DataFrame transpose, not the column named 'T'.
    print(a.T)
    # Read multiple columns: pass a list of names instead of a single name.
    print(a[['T', 'T']])
    # Read rows: note that slicing the frame selects a range of rows.
    print(a[1:2])
    # Find specific data in a column using a condition on a column.
    print(a['NE'].loc[a['NEE'] == 3])
    print(a['N'].loc[a['N'] == 3])
    # Read row by row.
    for index, row in a.iterrows():
        print(index, row['TI'])
    # Read the value at a specific (row, column) position.
    print(a.iloc[2, 1])
    # Summary statistics: max, min, std and the 0.25 / 0.5 / 0.75 quantiles.
    print(a.describe())
    # Sort by a column, descending.
    print(a.sort_values('T', ascending=False))


def _demo_filtering(a):
    """Print examples of boolean-mask filtering on ``a``."""
    print(a.loc[a['NEC'] <= 2])
    print(a.loc[(a['NE'] == 2) | (a['S'] == 2)])
    print(a.loc[(a['NE'] == 2) & (a['S'] == 2)])
    print(a.reset_index(drop=True))
    # na=False keeps the mask strictly boolean when 'T' has missing values;
    # a mask containing NaN cannot be used for indexing.
    print(a.loc[a['T'].str.contains('', na=False)])


def _demo_modifying(a):
    """Add, drop, recompute and reorder columns of ``a`` (mutates ``a``)."""
    a['TOTAL'] = a['T'] + a['TI']
    print(a.head(2))
    # Drop a specific column (returns a new frame; ``a`` keeps 'TOTAL').
    print(a.drop(columns=['TOTAL']).head(2))
    # Row-wise sum over specific columns: ':' means all rows, and 5:9 after
    # the comma selects column positions 5 through 8 (the end is exclusive).
    a['TOTAL'] = a.iloc[:, 5:9].sum(axis=1)
    print(a['TOTAL'].head(3))
    # Reorder / extract specific columns: the first four plus the
    # second-to-last one.
    columns = list(a.columns.values)
    print(a[columns[0:4] + columns[-2:-1]].head(3))


def _demo_conditional_changes(a):
    """Apply conditional replacements to ``a`` and print group counts."""
    a.loc[a['R'] == -9999, 'R'] = 0
    print(a)
    # Writing a string into a numeric column relies on silent upcasting,
    # which newer pandas versions warn about or reject; cast explicitly.
    if pd.api.types.is_numeric_dtype(a['RE']):
        a['RE'] = a['RE'].astype(object)
    a.loc[a['RE'] == 0, 'RE'] = 'Bingo'
    print(a)
    # Same replacement using a list of target columns.
    a.loc[a['RE'] == 0, ['RE']] = 'Bingo'
    print(a)
    # A constant helper column is required so that count()['count'] exists.
    a['count'] = 1
    print(a.groupby(['RE']).count()['count'])
    print(a)


def readcsv(path: str, output_path: str = 'new_csv') -> None:
    """Run a pandas walkthrough on every file found directly in ``path``.

    Each regular file in the directory is loaded with ``pd.read_csv`` and then
    passed through the read / filter / delete / modify / transform examples,
    printing the result of every step.

    The examples reference the columns 'T', 'TI', 'NE', 'NEE', 'N', 'NEC',
    'S', 'R' and 'RE', and read the cell at position (2, 1), so each file
    must provide those columns and at least three rows.

    Args:
        path: Directory whose entries are read as CSV files. Sub-directories
            are skipped.
        output_path: Destination of the saved copy (written without the
            index). It is overwritten for every input file, so after the call
            it holds the data of the last file processed.
    """
    # Sorted so the processing order (and the final saved file) is stable.
    for entry in sorted(os.listdir(path)):
        csv_file = os.path.join(path, entry)
        if not os.path.isfile(csv_file):
            continue  # read_csv cannot open a directory
        a = pd.read_csv(csv_file)

        # ---- read, filter, delete, modify, transform ----
        _demo_reading(a)

        # ---- filtering data ----
        _demo_filtering(a)

        # ---- making changes to data ----
        _demo_modifying(a)

        # ---- saving to a new csv ----
        # to_csv returns None when given a path, so there is nothing to print.
        a.to_csv(output_path, index=False)

        # ---- conditional change ----
        _demo_conditional_changes(a)


if __name__ == '__main__':
    readcsv(r'D:\副本 (2)')