python 37 pandas操作csv文件小结,csv文件合并

import pandas as pd
df = pd.read_csv("annotations.csv")[0:10]
## 一 DataFrame,数据帧df,可以将其看作表格 ### 列:index,行:columns
df
seriesuidcoordXcoordYcoordZdiameter_mm
01.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…-128.699421-175.319272-298.3875065.651471
11.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…103.783651-211.925149-227.1212504.224708
21.3.6.1.4.1.14519.5.2.1.6279.6001.100398138793…69.639017-140.944586876.3744965.786348
31.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…-24.013824192.102405-391.0812768.143262
41.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…2.441547172.464881-405.49373218.545150
51.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…90.931713149.027266-426.54471518.208570
61.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…89.540769196.405159-515.07332216.381276
71.3.6.1.4.1.14519.5.2.1.6279.6001.100953483028…81.50964654.957219-150.34642310.362321
81.3.6.1.4.1.14519.5.2.1.6279.6001.102681962408…105.05579219.825260-91.24725121.089619
91.3.6.1.4.1.14519.5.2.1.6279.6001.104562737760…-124.834262127.247155-473.06447910.465854
### 2 取其中某三列
pd.DataFrame(df,columns = ['seriesuid','coordX','coordY','coordZ'])
seriesuidcoordXcoordYcoordZ
01.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…-128.699421-175.319272-298.387506
11.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…103.783651-211.925149-227.121250
21.3.6.1.4.1.14519.5.2.1.6279.6001.100398138793…69.639017-140.944586876.374496
31.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…-24.013824192.102405-391.081276
41.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…2.441547172.464881-405.493732
51.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…90.931713149.027266-426.544715
61.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…89.540769196.405159-515.073322
71.3.6.1.4.1.14519.5.2.1.6279.6001.100953483028…81.50964654.957219-150.346423
81.3.6.1.4.1.14519.5.2.1.6279.6001.102681962408…105.05579219.825260-91.247251
91.3.6.1.4.1.14519.5.2.1.6279.6001.104562737760…-124.834262127.247155-473.064479
### 3 取其中某俩行
pd.DataFrame(df,index = [0,4])
seriesuidcoordXcoordYcoordZdiameter_mm
01.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…-128.699421-175.319272-298.3875065.651471
41.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…2.441547172.464881-405.49373218.545150
## 二 对DataFrame操作 ### 1 排序
df.sort_index(axis=1,ascending=True)
coordXcoordYcoordZdiameter_mmseriesuid
0-128.699421-175.319272-298.3875065.6514711.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…
1103.783651-211.925149-227.1212504.2247081.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…
269.639017-140.944586876.3744965.7863481.3.6.1.4.1.14519.5.2.1.6279.6001.100398138793…
3-24.013824192.102405-391.0812768.1432621.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…
42.441547172.464881-405.49373218.5451501.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…
590.931713149.027266-426.54471518.2085701.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…
689.540769196.405159-515.07332216.3812761.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…
781.50964654.957219-150.34642310.3623211.3.6.1.4.1.14519.5.2.1.6279.6001.100953483028…
8105.05579219.825260-91.24725121.0896191.3.6.1.4.1.14519.5.2.1.6279.6001.102681962408…
9-124.834262127.247155-473.06447910.4658541.3.6.1.4.1.14519.5.2.1.6279.6001.104562737760…
### 2 算数运算
df['corrd_X_Y'] = df['coordX']*df['coordY']
df
seriesuidcoordXcoordYcoordZdiameter_mmcorrd_X_Y
01.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…-128.699421-175.319272-298.3875065.65147122563.488788
11.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…103.783651-211.925149-227.1212504.224708-21994.365650
21.3.6.1.4.1.14519.5.2.1.6279.6001.100398138793…69.639017-140.944586876.3744965.786348-9815.242447
31.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…-24.013824192.102405-391.0812768.143262-4613.113389
41.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…2.441547172.464881-405.49373218.545150421.081078
51.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…90.931713149.027266-426.54471518.20857013551.304585
61.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…89.540769196.405159-515.07332216.38127617586.268931
71.3.6.1.4.1.14519.5.2.1.6279.6001.100953483028…81.50964654.957219-150.34642310.3623214479.543419
81.3.6.1.4.1.14519.5.2.1.6279.6001.102681962408…105.05579219.825260-91.24725121.0896192082.758414
91.3.6.1.4.1.14519.5.2.1.6279.6001.104562737760…-124.834262127.247155-473.06447910.465854-15884.804687
### 3 切片
df['diameter_mm']>6
0 False 1 False 2 False 3 True 4 True 5 True 6 True 7 True 8 True 9 True Name: diameter_mm, dtype: bool
df.loc[:,['coordX','coordY']]
coordXcoordY
0-128.699421-175.319272
1103.783651-211.925149
269.639017-140.944586
3-24.013824192.102405
42.441547172.464881
590.931713149.027266
689.540769196.405159
781.50964654.957219
8105.05579219.825260
9-124.834262127.247155
df.iloc[[0,1],2:4]
coordYcoordZ
0-175.319272-298.387506
1-211.925149-227.121250
df[df['diameter_mm']>10]
seriesuidcoordXcoordYcoordZdiameter_mmcorrd_X_Y
41.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…2.441547172.464881-405.49373218.545150421.081078
51.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…90.931713149.027266-426.54471518.20857013551.304585
61.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…89.540769196.405159-515.07332216.38127617586.268931
71.3.6.1.4.1.14519.5.2.1.6279.6001.100953483028…81.50964654.957219-150.34642310.3623214479.543419
81.3.6.1.4.1.14519.5.2.1.6279.6001.102681962408…105.05579219.825260-91.24725121.0896192082.758414
91.3.6.1.4.1.14519.5.2.1.6279.6001.104562737760…-124.834262127.247155-473.06447910.465854-15884.804687
### 4 合并
pd.concat([df,df,df],ignore_index=True) 
seriesuidcoordXcoordYcoordZdiameter_mmcorrd_X_Y
01.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…-128.699421-175.319272-298.3875065.65147122563.488788
11.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…103.783651-211.925149-227.1212504.224708-21994.365650
21.3.6.1.4.1.14519.5.2.1.6279.6001.100398138793…69.639017-140.944586876.3744965.786348-9815.242447
31.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…-24.013824192.102405-391.0812768.143262-4613.113389
41.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…2.441547172.464881-405.49373218.545150421.081078
51.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…90.931713149.027266-426.54471518.20857013551.304585
61.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…89.540769196.405159-515.07332216.38127617586.268931
71.3.6.1.4.1.14519.5.2.1.6279.6001.100953483028…81.50964654.957219-150.34642310.3623214479.543419
81.3.6.1.4.1.14519.5.2.1.6279.6001.102681962408…105.05579219.825260-91.24725121.0896192082.758414
91.3.6.1.4.1.14519.5.2.1.6279.6001.104562737760…-124.834262127.247155-473.06447910.465854-15884.804687
101.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…-128.699421-175.319272-298.3875065.65147122563.488788
111.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…103.783651-211.925149-227.1212504.224708-21994.365650
121.3.6.1.4.1.14519.5.2.1.6279.6001.100398138793…69.639017-140.944586876.3744965.786348-9815.242447
131.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…-24.013824192.102405-391.0812768.143262-4613.113389
141.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…2.441547172.464881-405.49373218.545150421.081078
151.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…90.931713149.027266-426.54471518.20857013551.304585
161.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…89.540769196.405159-515.07332216.38127617586.268931
171.3.6.1.4.1.14519.5.2.1.6279.6001.100953483028…81.50964654.957219-150.34642310.3623214479.543419
181.3.6.1.4.1.14519.5.2.1.6279.6001.102681962408…105.05579219.825260-91.24725121.0896192082.758414
191.3.6.1.4.1.14519.5.2.1.6279.6001.104562737760…-124.834262127.247155-473.06447910.465854-15884.804687
201.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…-128.699421-175.319272-298.3875065.65147122563.488788
211.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…103.783651-211.925149-227.1212504.224708-21994.365650
221.3.6.1.4.1.14519.5.2.1.6279.6001.100398138793…69.639017-140.944586876.3744965.786348-9815.242447
231.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…-24.013824192.102405-391.0812768.143262-4613.113389
241.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…2.441547172.464881-405.49373218.545150421.081078
251.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…90.931713149.027266-426.54471518.20857013551.304585
261.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…89.540769196.405159-515.07332216.38127617586.268931
271.3.6.1.4.1.14519.5.2.1.6279.6001.100953483028…81.50964654.957219-150.34642310.3623214479.543419
281.3.6.1.4.1.14519.5.2.1.6279.6001.102681962408…105.05579219.825260-91.24725121.0896192082.758414
291.3.6.1.4.1.14519.5.2.1.6279.6001.104562737760…-124.834262127.247155-473.06447910.465854-15884.804687
pd.merge(df,df,how='outer')
seriesuidcoordXcoordYcoordZdiameter_mmcorrd_X_Y
01.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…-128.699421-175.319272-298.3875065.65147122563.488788
11.3.6.1.4.1.14519.5.2.1.6279.6001.100225287222…103.783651-211.925149-227.1212504.224708-21994.365650
21.3.6.1.4.1.14519.5.2.1.6279.6001.100398138793…69.639017-140.944586876.3744965.786348-9815.242447
31.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…-24.013824192.102405-391.0812768.143262-4613.113389
41.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…2.441547172.464881-405.49373218.545150421.081078
51.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…90.931713149.027266-426.54471518.20857013551.304585
61.3.6.1.4.1.14519.5.2.1.6279.6001.100621383016…89.540769196.405159-515.07332216.38127617586.268931
71.3.6.1.4.1.14519.5.2.1.6279.6001.100953483028…81.50964654.957219-150.34642310.3623214479.543419
81.3.6.1.4.1.14519.5.2.1.6279.6001.102681962408…105.05579219.825260-91.24725121.0896192082.758414
91.3.6.1.4.1.14519.5.2.1.6279.6001.104562737760…-124.834262127.247155-473.06447910.465854-15884.804687

5 合并文件夹下所有同类型的csv的小例子

csv_files = glob.glob('/*/*/*.csv')
df = df = pd.DataFrame(columns=['seriesuid', 'coordX', 'coordY', 'coordZ', 'diameter_mm','des'])   
for csv in csv_files:
    df = pd.merge(df,pd.read_csv(csv),how='outer')
df_to_save = pd.DataFrame(df,columns=['seriesuid', 'coordX', 'coordY', 'coordZ', 'diameter_mm'])      
df_to_save.to_csv('annotations.csv',index=False)
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值