diff --git a/tests/test_threaded_pipeline.py b/tests/test_threaded_pipeline.py index 987171b0..138d2940 100644 --- a/tests/test_threaded_pipeline.py +++ b/tests/test_threaded_pipeline.py @@ -17,8 +17,18 @@ from docling.pipeline.standard_pdf_pipeline import StandardPdfPipeline from docling.pipeline.threaded_standard_pdf_pipeline import ThreadedStandardPdfPipeline +@pytest.mark.skip(reason="Requires models to be pre-downloaded; run manually to verify timeout behavior") def test_standard_pipeline_document_timeout(): - """Test that StandardPdfPipeline respects document_timeout""" + """Test that StandardPdfPipeline respects document_timeout + + This test verifies that when document_timeout is set, the pipeline will: + 1. Stop processing after the timeout period + 2. Return PARTIAL_SUCCESS status + 3. Return successfully processed pages + + Note: This test requires layout models to be pre-downloaded from HuggingFace. + It can be run manually with: pytest tests/test_threaded_pipeline.py::test_standard_pipeline_document_timeout -v + """ test_file = "tests/data/pdf/2203.01017v2.pdf" # Large file to ensure timeout can occur # Configure pipeline with very short timeout