1
0
mirror of https://github.com/scrapy/scrapy.git synced 2025-02-11 14:51:32 +00:00
scrapy/tests/test_spidermiddleware_depth.py

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

42 lines
1.3 KiB
Python
Raw Normal View History

2009-09-07 11:14:43 -03:00
from unittest import TestCase
2023-01-25 14:25:15 -06:00
from scrapy.http import Request, Response
from scrapy.spidermiddlewares.depth import DepthMiddleware
from scrapy.spiders import Spider
from scrapy.statscollectors import StatsCollector
from scrapy.utils.test import get_crawler
2009-09-07 11:14:43 -03:00
class TestDepthMiddleware(TestCase):
def setUp(self):
crawler = get_crawler(Spider)
self.spider = crawler._create_spider("scrapytest.org")
2009-09-07 11:14:43 -03:00
self.stats = StatsCollector(crawler)
self.stats.open_spider(self.spider)
2009-09-07 11:14:43 -03:00
self.mw = DepthMiddleware(1, self.stats, True)
2009-09-07 11:14:43 -03:00
def test_process_spider_output(self):
req = Request("http://scrapytest.org")
resp = Response("http://scrapytest.org")
resp.request = req
result = [Request("http://scrapytest.org")]
out = list(self.mw.process_spider_output(resp, result, self.spider))
self.assertEqual(out, result)
2009-09-07 11:14:43 -03:00
rdc = self.stats.get_value("request_depth_count/1", spider=self.spider)
self.assertEqual(rdc, 1)
2009-09-07 11:14:43 -03:00
req.meta["depth"] = 1
out2 = list(self.mw.process_spider_output(resp, result, self.spider))
self.assertEqual(out2, [])
2009-09-07 11:14:43 -03:00
rdm = self.stats.get_value("request_depth_max", spider=self.spider)
self.assertEqual(rdm, 1)
2009-09-07 11:14:43 -03:00
def tearDown(self):
self.stats.close_spider(self.spider, "")