# File: pipelines.py
from pydispatch import dispatcher
from scrapy import signals
from openpyxl import Workbook
class FirstexcelPipeline(object):
    """Item pipeline that accumulates scraped items in an Excel worksheet.

    A workbook is created when the pipeline is instantiated, one row is
    appended per processed item, and the workbook is written to disk when
    the ``spider_closed`` signal fires.
    """

    def __init__(self):
        """Create the workbook, write the header row and hook spider shutdown."""
        # Save the workbook once the spider has finished.
        dispatcher.connect(self.colse_spider, signals.spider_closed)
        self.wb = Workbook()
        self.ws = self.wb.active
        # Header row; column order must match the rows built in process_item.
        self.ws.append(['写入名字', '写入title', '详细信息'])

    def process_item(self, item, spider):
        """Append one item to the worksheet and pass the item on unchanged.

        Args:
            item: Mapping-like object providing the keys ``'name'``,
                ``'title'`` and ``'info'``.
            spider: The spider that produced the item (unused).

        Returns:
            The same ``item`` object that was passed in.

        Raises:
            KeyError: If ``item`` lacks one of the three keys (assuming
                ``item`` follows normal mapping semantics).
        """
        row = [item['name'], item['title'], item['info']]
        self.ws.append(row)
        return item

    def colse_spider(self, spider):
        """Write the accumulated workbook to disk.

        Registered for the ``spider_closed`` signal in ``__init__``.

        NOTE(review): the name looks like a misspelling of ``close_spider``.
        It is kept as is because it is wired up by reference; renaming it to
        ``close_spider`` would presumably make Scrapy's own pipeline hook
        call it as well, saving the file twice -- confirm before renaming.

        Args:
            spider: The spider that was closed (unused).
        """
        print('结束')
        # Raw string: the Windows path contains backslashes that are not
        # valid escape sequences; the resulting value is unchanged.
        self.wb.save(r'D:\脚本数据\py\datacache\写入测试.xlsx')
# File: getdatas.py
import scrapy
from ..items import FirstexcelItem
class GetdatasSpider(scrapy.Spider):
name = 'getdatas'
allowed_domains = ['i