mirror of
https://github.com/scrapy/scrapy.git
synced 2025-02-25 20:04:28 +00:00
commit
f40587c661
@ -49,8 +49,14 @@ class RobotsTxtMiddleware(object):
|
||||
)
|
||||
dfd = self.crawler.engine.download(robotsreq, spider)
|
||||
dfd.addCallback(self._parse_robots)
|
||||
dfd.addErrback(self._logerror, robotsreq, spider)
|
||||
return self._parsers[netloc]
|
||||
|
||||
def _logerror(self, failure, request, spider):
    """Log a failed download at ERROR level unless it is an IgnoreRequest.

    Attached as an errback to the download deferred of the robots request,
    which supplies ``request`` and ``spider`` as extra arguments.

    :param failure: failure object; only its ``type`` and ``value`` are read.
    :param request: the request whose download failed (shown in the message).
    :param spider: the spider handed through to the log call.
    :returns: None.
    """
    if failure.type is not IgnoreRequest:
        # Pass the error value as a named field instead of pre-formatting it
        # into the format string: the format is expanded again by the logger,
        # so a literal "%" in the error text (e.g. a percent-encoded URL)
        # would otherwise be misread as a conversion specifier.
        log.msg(format="Error downloading %(request)s: %(errmsg)s",
                level=log.ERROR, request=request, errmsg=failure.value,
                spider=spider)
|
||||
|
||||
def _parse_robots(self, response):
|
||||
rp = robotparser.RobotFileParser(response.url)
|
||||
rp.parse(response.body.splitlines())
|
||||
|
Loading…
x
Reference in New Issue
Block a user