# -*- coding: utf-8 -*-
import scrapy
from Novels1.items import Novels1Item
class Novels80Spider(scrapy.Spider):
    """Spider that scrapes the novel listing at ``http://txt80.com/dushi/``.

    For every listing entry on the page it yields a ``Novels1Item`` carrying
    the entry's title, author and cover-image URL.
    """

    name = 'novels80'
    allowed_domains = ['txt80.com']
    start_urls = ['http://txt80.com/dushi/']

    def parse(self, response):
        """Yield one ``Novels1Item`` per complete listing entry in *response*.

        Args:
            response: The downloaded listing page.

        Yields:
            Novels1Item: Populated with ``title``, ``auth`` and ``img``.
            Entries for which any of the three values cannot be located are
            skipped (with a warning) instead of aborting the whole page.
        """
        # The last two child <div>s of the list box are excluded.
        # NOTE(review): presumably they are not novel entries (e.g. paging
        # controls) -- confirm against the live page markup.
        entries = response.xpath('//div[@class="list_l_box"]/div')[:-2]

        for entry in entries:
            # SelectorList.get() returns the first match as a string, or None
            # when nothing matched. Indexing with [0] first would raise
            # IndexError on a malformed entry and stop the generator, dropping
            # every remaining entry on the page.
            title = entry.xpath('./div[@class="info"]/h4/a/text()').get()
            auth = entry.xpath('./div[@class="info"]/p[1]/b/a[2]/text()').get()
            img = entry.xpath('./div[@class="pic"]/a/img/@src').get()

            if title is None or auth is None or img is None:
                # Keep the output contract: only fully populated items are
                # emitted, so downstream pipelines never see None fields.
                self.logger.warning(
                    'Skipping incomplete entry on %s '
                    '(title=%r, auth=%r, img=%r)',
                    response.url, title, auth, img,
                )
                continue

            yield Novels1Item(title=title, auth=auth, img=img)