diff --git a/tests/resources/test_3594.pdf b/tests/resources/test_3594.pdf new file mode 100644 index 000000000..ea3c44424 Binary files /dev/null and b/tests/resources/test_3594.pdf differ diff --git a/tests/test_textextract.py b/tests/test_textextract.py index 5374e153f..771ea9dfe 100644 --- a/tests/test_textextract.py +++ b/tests/test_textextract.py @@ -314,3 +314,18 @@ def llen(texts): if _stats: pymupdf._log_items_clear() + + +def test_3594(): + print() + d = pymupdf.open(os.path.abspath(f'{__file__}/../../tests/resources/test_3594.pdf')) + for i, p in enumerate(d.pages()): + text = p.get_text() + print('='*40) + print(f'Page {i}:') + for line in text.split('\n'): + print(f' {line!r}') + if pymupdf.mupdf_version_tuple < (1, 24, 3): + # We expect MuPDF warnings. + wt = pymupdf.TOOLS.mupdf_warnings() + assert wt