File: test_on_fetched_robotstxt.py

package info (click to toggle)
python-protego 0.2.1%2Bdfsg-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 30,208 kB
  • sloc: python: 1,430; perl: 190; cpp: 33; sh: 12; makefile: 3
file content (23 lines) | stat: -rw-r--r-- 847 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
from os import listdir
from os.path import abspath, dirname, isfile, join

import pytest

from protego import Protego

test_data_directory = join(dirname(abspath(__file__)), 'test_data')
robotstxts = [f for f in listdir(test_data_directory) if isfile(join(test_data_directory, f))]


@pytest.mark.parametrize('path_to_robotstxt', robotstxts)
def test_no_exceptions(path_to_robotstxt):
    try:
        with open(join(test_data_directory, path_to_robotstxt), 'rb') as f:
            try:
                content = f.read().decode('utf-8')
            except UnicodeDecodeError:
                # Downloaded robots.txt is malformed, ignore this
                return
            Protego.parse(content=content)
    except Exception as e:
        assert False, "{}. Exception raised while parsing {}".format(e, join(path_to_robotstxt, 'robots.txt'))