csv文件的读取与写入
1、新建一个test.csv文件,数据如下:
Symbol,Price,Date,Time,Change,Volume
"AA",39.48,"6/11/2007","9:36am",-0.18,181800
"AIG",71.38,"6/11/2007","9:36am",-0.15,195500
"AXP",62.58,"6/11/2007","9:36am",-0.46,935000
"BA",98.31,"6/11/2007","9:36am",+0.12,104800
"C",53.08,"6/11/2007","9:36am",-0.25,360900
"CAT",78.29,"6/11/2007","9:36am",-0.23,225400
2、读操作
import csv  # Part of the standard library; no pip install needed.

# Read test.csv row by row and print every row as a comma-separated line.
# newline="" hands line-ending handling to the csv module, as the csv
# documentation recommends for any file object passed to reader/writer.
with open("test.csv", newline="", encoding="utf-8") as f:
    # csv.reader wraps the file handle f and returns a reader object: an
    # iterator that produces one row each time next() is called on it.
    f_csv = csv.reader(f)
    # For attribute-style access, the header row could be consumed to build a
    # named tuple type: Row = namedtuple("Row", next(f_csv)).
    print(f_csv)
    for row in f_csv:  # each row is a list holding that line's fields
        # With the named tuple above, row_ = Row(*row) would work here, but
        # only when every header in the first line is a valid Python
        # identifier.
        print(", ".join(row))
打印结果:
<_csv.reader object at 0x000002A97FE1FB80>
Symbol, Price, Date, Time, Change, Volume
AA, 39.48, 6/11/2007, 9:36am, -0.18, 181800
AIG, 71.38, 6/11/2007, 9:36am, -0.15, 195500
AXP, 62.58, 6/11/2007, 9:36am, -0.46, 935000
BA, 98.31, 6/11/2007, 9:36am, +0.12, 104800
C, 53.08, 6/11/2007, 9:36am, -0.25, 360900
CAT, 78.29, 6/11/2007, 9:36am, -0.23, 225400
由于`row`是一个列表,访问某一行中的某一列数据的时候,必须使用`row[1]`这种下标方式,可能会引起混淆,因此我们可以使用命名元组或者字典读取器`DictReader`来进行改善。
import csv

# Read test.csv and print each data row as a mapping keyed by column name.
# newline="" hands line-ending handling to the csv module, as the csv
# documentation recommends for any file object passed to reader/writer.
with open("test.csv", newline="", encoding="utf-8") as f:
    # DictReader uses the first line of the file as the field names and
    # yields every following line as a mapping from field name to value.
    reader = csv.DictReader(f)
    for row in reader:
        # A column is read by key, e.g. row["Price"], instead of by index.
        print(row)
打印结果:
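{'Symbol': 'AA', 'Price': '39.48', 'Date': '6/11/2007', 'Time': '9:36am', 'Change': '-0.18', 'Volume': '181800'}
{'Symbol': 'AIG', 'Price': '71.38', 'Date': '6/11/2007', 'Time': '9:36am', 'Change': '-0.15', 'Volume': '195500'}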
{'Symbol': 'AXP', 'Price': '62.58', 'Date': '6/11/2007', 'Time': '9:36am', 'Change': '-0.46', 'Volume': '935000'}
{'Symbol': 'BA', 'Price': '98.31', 'Date': '6/11/2007', 'Time': '9:36am', 'Change': '+0.12', 'Volume': '104800'}
{'Symbol': 'C', 'Price': '53.08', 'Date': '6/11/2007', 'Time': '9:36am', 'Change': '-0.25', 'Volume': '360900'}
{'Symbol': 'CAT', 'Price': '78.29', 'Date': '6/11/2007', 'Time': '9:36am', 'Change': '-0.23', 'Volume': '225400'}
3、写操作
import csv  # repeated here so this snippet runs on its own

# Column names written as the first line of the output file.
headers = ["Symbol", "Price", "Date", "Time", "Change", "Volume"]
# One tuple per data row, in the same column order as headers.
rows = [
    ("AA", 39.48, "6/11/2007", "9:36am", -0.18, 181800),
    ("AIG", 71.38, "6/11/2007", "9:36am", -0.15, 195500),
    ("AXP", 62.58, "6/11/2007", "9:36am", -0.46, 935000),
]

# newline="" is required when writing: the csv writer emits "\r\n" itself,
# and without it text mode on Windows turns that into "\r\r\n", which shows
# up as an empty line after every row.
with open("stocks.csv", "w", newline="", encoding="utf-8") as f:
    f_csv = csv.writer(f)
    # writerow/writerows accept any iterable, not only lists.
    f_csv.writerow(headers)  # write a single row
    f_csv.writerows(rows)  # write several rows at once
使用DictWriter来进行写入
import csv  # repeated here so this snippet runs on its own

# Field names: they fix the column order and are written by writeheader().
headers = ["Symbol", "Price", "Date", "Time", "Change", "Volume"]
# One dict per data row, keyed by the field names above.
rows = [
    {
        "Symbol": "AA",
        "Price": 39.48,
        "Date": "6/11/2007",
        "Time": "9:36am",
        "Change": -0.18,
        "Volume": 181800,
    },
    {
        "Symbol": "AIG",
        "Price": 71.38,
        "Date": "6/11/2007",
        "Time": "9:36am",
        "Change": -0.15,
        "Volume": 195500,
    },
    {
        "Symbol": "AXP",
        "Price": 62.58,
        "Date": "6/11/2007",
        "Time": "9:36am",
        "Change": -0.46,
        "Volume": 935000,
    },
]

# newline="" is required when writing: the csv writer emits "\r\n" itself,
# and without it text mode on Windows turns that into "\r\r\n", which shows
# up as an empty line after every row.
with open("stocks.csv", "w", newline="", encoding="utf-8") as f:
    f_csv = csv.DictWriter(f, headers)
    f_csv.writeheader()  # write the field names as the first line
    f_csv.writerows(rows)  # write every dict as one row, ordered by headers