# Save as a CSV file (保存为csv文件)
from scrapy.exporters import CsvItemExporter
class FtimesPipeline(object):
    """Scrapy item pipeline that writes every item to ``ftoutput.csv``.

    The output file is opened when the spider starts and closed when it
    finishes. Fields are separated with ``~`` instead of a comma.
    """

    def open_spider(self, spider):
        """Open the output file and start the CSV exporter.

        Args:
            spider: The spider being opened (unused).
        """
        # CsvItemExporter is handed a file opened in binary mode.
        self.file = open('ftoutput.csv', 'wb')
        try:
            self.exporter = CsvItemExporter(self.file, delimiter='~')
            self.exporter.start_exporting()
        except Exception:
            # Do not leak the file handle if the exporter cannot be set up.
            self.file.close()
            raise

    def close_spider(self, spider):
        """Finish the export and close the output file.

        The file is closed even if finishing the export raises.

        Args:
            spider: The spider being closed (unused).
        """
        try:
            self.exporter.finish_exporting()
        finally:
            self.file.close()

    def process_item(self, item, spider):
        """Export one item and pass it on unchanged.

        Args:
            item: The scraped item to write.
            spider: The spider that produced the item (unused).

        Returns:
            The same ``item`` object that was passed in.
        """
        self.exporter.export_item(item)
        return item
# Save as an xlsx file (保存为xlsx文件)
from openpyxl import Workbook
class MapdataPipeline(object):
    """Scrapy item pipeline that collects items into ``printingshop.xlsx``.

    Each item contributes one row holding its ``area`` and ``total`` values,
    below a header row. The workbook is created per pipeline instance and
    written to disk once, when the spider closes.
    """

    def __init__(self):
        """Create an empty workbook and write the header row."""
        # Built per instance rather than at class-definition time, so that
        # importing the module has no side effects and separate pipeline
        # instances do not share (and keep appending to) one workbook.
        self.wb = Workbook()
        self.ws = self.wb.active
        # Set the header row.
        self.ws.append(['area', 'total'])

    def process_item(self, item, spider):
        """Append one item to the worksheet as a row.

        Args:
            item: Scraped item; must provide ``'area'`` and ``'total'`` keys.
            spider: The spider that produced the item (unused).

        Returns:
            The same ``item`` object that was passed in.
        """
        # Add the data, one row per item.
        self.ws.append([item['area'], item['total']])
        return item

    def close_spider(self, spider):
        """Write the workbook to ``printingshop.xlsx``.

        Saving happens once here instead of after every item, which avoids
        rewriting the whole file for each appended row.

        Args:
            spider: The spider being closed (unused).
        """
        self.wb.save('printingshop.xlsx')