最终效果如下:
······················主程序:·······································
# -*- coding: utf-8 -*- import scrapy import requests import json from qidian.items import QidianItem class MyqidianSpider(scrapy.Spider): name = 'myqidian' allowed_domains = ['qidian.com'] start_urls = ['http://www.qidian.com/all?chanId=21&orderId=&page=1&style=1&pageSize=20&siteid=1&pubflag=0&hiddenField=0'] def parse(self, response): # print(response.text) bookList = response.xpath('//ul[@class="all-img-list cf"]/li') for i in bookList: bookId = i.xpath('./div[@class="book-img-box"]/a/@data-bid').extract()[0]