From 460b247b664577d92b97e9ef66758949c3cce8ef Mon Sep 17 00:00:00 2001 From: Christoph Auer Date: Thu, 10 Jul 2025 11:39:22 +0200 Subject: [PATCH] OCR tests use DPv1 until rotation bugs are fixed Signed-off-by: Christoph Auer --- tests/test_e2e_ocr_conversion.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/tests/test_e2e_ocr_conversion.py b/tests/test_e2e_ocr_conversion.py index 16e50146..77e6fac1 100644 --- a/tests/test_e2e_ocr_conversion.py +++ b/tests/test_e2e_ocr_conversion.py @@ -2,6 +2,10 @@ import sys from pathlib import Path from typing import List, Tuple +from docling.backend.docling_parse_backend import DoclingParseDocumentBackend +from docling.backend.docling_parse_v2_backend import DoclingParseV2DocumentBackend +from docling.backend.docling_parse_v4_backend import DoclingParseV4DocumentBackend +from docling.backend.pypdfium2_backend import PyPdfiumDocumentBackend from docling.datamodel.accelerator_options import AcceleratorDevice from docling.datamodel.base_models import InputFormat from docling.datamodel.document import ConversionResult @@ -43,7 +47,7 @@ def get_converter(ocr_options: OcrOptions): format_options={ InputFormat.PDF: PdfFormatOption( pipeline_options=pipeline_options, - backend=PdfFormatOption().backend, + backend=DoclingParseDocumentBackend, # PdfFormatOption().backend, ) } )