File: test_linebreaks.py

package info (click to toggle)
pymupdf 1.25.4%2Bds1-3
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 98,632 kB
  • sloc: python: 43,379; ansic: 75; makefile: 6
file content (16 lines) | stat: -rw-r--r-- 558 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
import pymupdf

import os.path


def test_linebreaks():
    """Test avoidance of linebreaks.

    Extracts text from the first page of ``test-linebreaks.pdf`` through a
    single shared text page and compares counts: plain text extraction must
    yield exactly one line per extracted word, while extraction with
    ``sort=True`` must yield fewer than half as many lines.
    """
    # abspath() collapses the "/../.." segments, so the path is resolved
    # relative to this file's location rather than the working directory.
    path = os.path.abspath(f"{__file__}/../../tests/resources/test-linebreaks.pdf")
    # Use the document as a context manager so it is closed even when one of
    # the extraction calls raises.
    with pymupdf.open(path) as doc:
        page = doc[0]
        # One text page is reused for all three extractions below.
        tp = page.get_textpage(flags=pymupdf.TEXTFLAGS_WORDS)
        word_count = len(page.get_text("words", textpage=tp))
        line_count1 = len(page.get_text(textpage=tp).splitlines())
        line_count2 = len(page.get_text(sort=True, textpage=tp).splitlines())
    assert word_count == line_count1, f"{word_count=} {line_count1=}"
    assert line_count2 < line_count1 / 2, f"{line_count2=} {line_count1=}"