1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104
|
#
# diffoscope: in-depth comparison of files, archives, and directories
#
# Copyright © 2015 Jérémy Bobbio <lunar@debian.org>
# Copyright © 2015-2018, 2020-2021, 2023 Chris Lamb <lamby@debian.org>
#
# diffoscope is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# diffoscope is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with diffoscope. If not, see <https://www.gnu.org/licenses/>.
import pytest
from diffoscope.comparators.pdf import PdfFile
from ..utils.data import load_fixture, assert_diff
from ..utils.tools import (
skip_unless_tools_exist,
skip_unless_module_exists,
skipif,
)
from ..utils.nonexisting import assert_non_existing
pdf1 = load_fixture("test1.pdf")
pdf2 = load_fixture("test2.pdf")
pdf3 = load_fixture("test3.pdf")
pdf4 = load_fixture("test4.pdf")
pdf1a = load_fixture("test_weird_non_unicode_chars1.pdf")
pdf2a = load_fixture("test_weird_non_unicode_chars2.pdf")
def skip_unless_pypdf3():
def fn():
try:
import pypdf
except ImportError:
return True
return not pypdf.__version__.startswith("3.")
return skipif(fn(), reason="pypdf not installed or not version 3.x+")
def test_identification(pdf1):
assert isinstance(pdf1, PdfFile)
def test_no_differences(pdf1):
difference = pdf1.compare(pdf1)
assert difference is None
def test_differences_found_with_weird_encoding(pdf1a, pdf2a):
# diffoscope used to crash here due to weird encoding
difference = pdf1a.compare(pdf2a)
assert difference
@pytest.fixture
def differences(pdf1, pdf2):
return pdf1.compare(pdf2).details
@skip_unless_tools_exist("pdftotext")
def test_text_diff(differences):
assert_diff(differences[0], "pdf_text_expected_diff")
@skip_unless_tools_exist("pdftotext")
def test_compare_non_existing(monkeypatch, pdf1):
assert_non_existing(monkeypatch, pdf1, has_null_source=False)
@pytest.fixture
def differences_metadata(pdf1, pdf1a):
return pdf1.compare(pdf1a).details
@skip_unless_pypdf3()
@skip_unless_tools_exist("pdftotext")
def test_metadata(differences_metadata):
assert len(differences_metadata) == 2
assert_diff(differences_metadata[0], "pdf_metadata_expected_diff")
@pytest.fixture
def differences_annotations(pdf3, pdf4):
return pdf3.compare(pdf4).details
@skip_unless_pypdf3()
@skip_unless_tools_exist("pdftotext")
def test_annotations(differences_annotations):
assert_diff(differences_annotations[0], "pdf_annotations_expected_diff")
|