diff tests/test_linebreaks.py @ 1:1d09e1dec1d9 upstream

ADD: PyMuPDF v1.26.4: the original sdist. It does not yet contain MuPDF. This normally will be downloaded when building PyMuPDF.
author Franz Glasner <fzglas.hg@dom66.de>
date Mon, 15 Sep 2025 11:37:51 +0200
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tests/test_linebreaks.py	Mon Sep 15 11:37:51 2025 +0200
@@ -0,0 +1,16 @@
+import pymupdf
+
+import os.path
+
+
+def test_linebreaks():
+    """Check that sorted text extraction yields far fewer lines than unsorted extraction."""
+    path = os.path.abspath(f"{__file__}/../../tests/resources/test-linebreaks.pdf")
+    with pymupdf.open(path) as doc:  # closes the document even when an assertion fails
+        page = doc[0]
+        tp = page.get_textpage(flags=pymupdf.TEXTFLAGS_WORDS)  # one textpage reused by every call below
+        word_count = len(page.get_text("words", textpage=tp))
+        line_count1 = len(page.get_text(textpage=tp).splitlines())  # default output, unsorted
+        line_count2 = len(page.get_text(sort=True, textpage=tp).splitlines())  # same output with sort=True
+        assert word_count == line_count1  # unsorted: exactly one output line per extracted word
+        assert line_count2 < line_count1 / 2  # sorted: fewer than half as many lines