view tests/test_2907.py @ 35:f0e1e5146733

Comment about building with tesseract
author Franz Glasner <fzglas.hg@dom66.de>
date Sun, 21 Sep 2025 19:06:03 +0200
parents 1d09e1dec1d9
children
line wrap: on
line source

import pymupdf

import os.path
import pathlib

def test_2907():
    """Regression test for issue 2907: run `clean_contents()` on a sample PDF.

    The underlying bug ('segfault trying to call clean_contents on certain
    pdfs with python 3.12') affects the classic implementation and will not
    be fixed there, so the test returns early when `pymupdf` does not expose
    a `mupdf` attribute.
    """
    running_on_classic = not hasattr(pymupdf, 'mupdf')
    if running_on_classic:
        print('test_2907(): not running on classic because known to fail.')
        return

    # Resolve the sample PDF relative to this test file and load it fully
    # into memory, so the document is opened from a byte stream.
    resource = os.path.abspath(f'{__file__}/../../tests/resources/test_2907.pdf')
    document = pymupdf.open(
        stream=pathlib.Path(resource).read_bytes(),
        filetype="application/pdf",
    )

    # Single-element unpacking raises ValueError unless the document yields
    # exactly one page.
    [only_page] = list(document.pages())
    only_page.clean_contents()