scrapy-scheduler

 1 # Role of the scheduler: controls how Request objects are stored and retrieved, and filters out duplicate Requests.
 2 
 3 class Scheduler(object):  # holds the dupefilter, the queue classes and the stats object it is constructed with
 4 
 5     def __init__(self, dupefilter, jobdir=None, dqclass=None, mqclass=None,
 6                  logunser=False, stats=None, pqclass=None):
 7         self.df = dupefilter  # duplicate-request filter instance
 8         self.dqdir = self._dqdir(jobdir)  # derived from jobdir by _dqdir (helper not shown in this excerpt)
 9         self.pqclass = pqclass  # priority queue
10         self.dqclass = dqclass  # disk-backed (serialized) queue, used to resume an interrupted crawl
11         self.mqclass = mqclass  # in-memory queue
12         self.logunser = logunser  # from_crawler fills this from the LOG_UNSERIALIZABLE_REQUESTS setting
13         self.stats = stats  # from_crawler passes crawler.stats here
14 
15     @classmethod
16     def from_crawler(cls, crawler):  # alternate constructor: builds the instance from crawler.settings and crawler.stats
17         settings = crawler.settings
18         dupefilter_cls = load_object(settings['DUPEFILTER_CLASS'])  # setting value is resolved to an object by load_object
19         dupefilter = dupefilter_cls.from_settings(settings)
20         pqclass = load_object(settings['SCHEDULER_PRIORITY_QUEUE'])
21         dqclass = load_object(settings['SCHEDULER_DISK_QUEUE'])
22         mqclass = load_object(settings['SCHEDULER_MEMORY_QUEUE'])
23         logunser = settings.getbool('LOG_UNSERIALIZABLE_REQUESTS', settings.getbool('SCHEDULER_DEBUG'))  # presumably SCHEDULER_DEBUG is the fallback when the first setting is unset - confirm getbool's second argument
24         return cls(dupefilter, jobdir=job_dir(settings), logunser=logunser,
25                    stats=crawler.stats, pqclass=pqclass, dqclass=dqclass, mqclass=mqclass)

 

 

转载于:https://www.cnblogs.com/liyugeng/p/7890149.html

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值