# -*- coding: utf-8 -*-
BOT_NAME = "eie"

# Spider package: NEWSPIDER_MODULE and the single entry of SPIDER_MODULES
# both point at the same package.
NEWSPIDER_MODULE = "eie.spiders"
SPIDER_MODULES = [NEWSPIDER_MODULE]

# --- Crawl behaviour ---

# robots.txt rules are not obeyed.
ROBOTSTXT_OBEY = False

# Download delay between requests.
DOWNLOAD_DELAY = 3

# Cookie handling is switched off.
COOKIES_ENABLED = False
# Downloader middlewares: a hook framework sitting between the Scrapy engine
# and the downloader, processing the requests and responses that pass
# between the two.
DOWNLOADER_MIDDLEWARES = {
    # A value of None disables the built-in User-Agent middleware. The key
    # must be the middleware's current import path: the legacy
    # ``scrapy.contrib.downloadermiddleware`` location was deprecated in
    # Scrapy 1.0 and later removed, so an entry under the old path no longer
    # matches the built-in middleware on current Scrapy releases.
    'scrapy.downloadermiddlewares.useragent.UserAgentMiddleware': None,
    # Project middleware, registered with order value 100.
    'eie.middlewares.random_user_agent.RandomUserAgent': 100,
}
# Item pipelines: maps each pipeline's import path to its order value.
ITEM_PIPELINES = {"eie.pipelines.EiePipeline": 100}
# --- MySQL database configuration ---
# NOTE(review): credentials are hard-coded here; presumably acceptable for a
# local/dev setup only -- confirm before deploying or committing.

# Server location and schema
MYSQL_HOST = "192.168.5.126"
MYSQL_DBNAME = "eie"

# Login
MYSQL_USER = "root"
MYSQL_PASSWD = "000000"

# Connection pool size
MYSQL_POOL_SIZE = 8
# Chapter 1.4: Scrapy settings
# (Page footer from the source article: "Latest recommended article published 2023-07-06 10:55:17")