From 8aef4ec4cf96afb536334035fccf63e15fc8570a Mon Sep 17 00:00:00 2001
From: hpierre001 <58784889+hpierre001@users.noreply.github.com>
Date: Tue, 22 Oct 2024 21:57:22 +0200
Subject: [PATCH] TST: Add test for ``layout_mode_font_height_weight`` of
 ``PageObject.extract_text()``

---
Reviewer note (ignored by git am): the new test calls
PageObject.extract_text() on page 0 of attachment.pdf with
extraction_mode="layout", layout_mode_space_vertically=True and
layout_mode_font_height_weight=0.85, then asserts that two known
strings appear in the output followed by an empty line ("\n\n").
The test's docstring links it to #2915.

 tests/test_text_extraction.py | 10 ++++++++++
 1 file changed, 10 insertions(+)

diff --git a/tests/test_text_extraction.py b/tests/test_text_extraction.py
index 1908e7f15..5d5f28ee2 100644
--- a/tests/test_text_extraction.py
+++ b/tests/test_text_extraction.py
@@ -219,3 +219,13 @@ def test_text_leading_height_unit():
     page = reader.pages[0]
     extracted = page.extract_text()
     assert "Something[cited]\n" in extracted
+
+
+def test_layout_mode_vertical_space():
+    """Tests for #2915"""
+    reader = PdfReader(RESOURCE_ROOT / "attachment.pdf")
+    page = reader.pages[0]
+    extracted = page.extract_text(extraction_mode="layout", layout_mode_space_vertically=True,
+                                  layout_mode_font_height_weight=0.85)
+    assert "The Crazy Ones\nOctober 14, 1998\n\n" in extracted
+    assert "The round pegs in the square holes.\n\n" in extracted