File: test_spidermiddleware_depth.py

package info (click to toggle)
python-scrapy 2.13.3-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 5,664 kB
  • sloc: python: 52,028; xml: 199; makefile: 25; sh: 7
file content (38 lines) | stat: -rw-r--r-- 1,267 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
from scrapy.http import Request, Response
from scrapy.spidermiddlewares.depth import DepthMiddleware
from scrapy.spiders import Spider
from scrapy.utils.test import get_crawler


class TestDepthMiddleware:
    def setup_method(self):
        crawler = get_crawler(Spider, {"DEPTH_LIMIT": 1, "DEPTH_STATS_VERBOSE": True})
        self.spider = crawler._create_spider("scrapytest.org")

        self.stats = crawler.stats
        self.stats.open_spider(self.spider)

        self.mw = DepthMiddleware.from_crawler(crawler)

    def test_process_spider_output(self):
        req = Request("http://scrapytest.org")
        resp = Response("http://scrapytest.org")
        resp.request = req
        result = [Request("http://scrapytest.org")]

        out = list(self.mw.process_spider_output(resp, result, self.spider))
        assert out == result

        rdc = self.stats.get_value("request_depth_count/1", spider=self.spider)
        assert rdc == 1

        req.meta["depth"] = 1

        out2 = list(self.mw.process_spider_output(resp, result, self.spider))
        assert not out2

        rdm = self.stats.get_value("request_depth_max", spider=self.spider)
        assert rdm == 1

    def teardown_method(self):
        self.stats.close_spider(self.spider, "")