Rename docling-parse backend from v3 to v4

Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
2025-12-08 20:58:11 +00:00 · 2025-03-14 12:35:06 +01:00
parent b77f73beec
commit af18215714
9 changed files with 25 additions and 25 deletions
--- a/tests/test_backend_docling_parse_v4.py
+++ b/tests/test_backend_docling_parse_v4.py
@@ -2,9 +2,9 @@ from pathlib import Path

 import pytest

-from docling.backend.docling_parse_v3_backend import (
-    DoclingParseV3DocumentBackend,
-    DoclingParseV3PageBackend,
+from docling.backend.docling_parse_v4_backend import (
+    DoclingParseV4DocumentBackend,
+    DoclingParseV4PageBackend,
 )
 from docling.datamodel.base_models import BoundingBox, InputFormat
 from docling.datamodel.document import InputDocument
@@ -19,7 +19,7 @@ def _get_backend(pdf_doc):
    in_doc = InputDocument(
        path_or_stream=pdf_doc,
        format=InputFormat.PDF,
-        backend=DoclingParseV3DocumentBackend,
+        backend=DoclingParseV4DocumentBackend,
    )

    doc_backend = in_doc._backend
@@ -34,7 +34,7 @@ def test_text_cell_counts():
    for page_index in range(0, doc_backend.page_count()):
        last_cell_count = None
        for i in range(10):
-            page_backend: DoclingParseV3PageBackend = doc_backend.load_page(0)
+            page_backend: DoclingParseV4PageBackend = doc_backend.load_page(0)
            cells = list(page_backend.get_text_cells())

            if last_cell_count is None:
@@ -49,7 +49,7 @@ def test_text_cell_counts():

 def test_get_text_from_rect(test_doc_path):
    doc_backend = _get_backend(test_doc_path)
-    page_backend: DoclingParseV3PageBackend = doc_backend.load_page(0)
+    page_backend: DoclingParseV4PageBackend = doc_backend.load_page(0)

    # Get the title text of the DocLayNet paper
    textpiece = page_backend.get_text_in_rect(
@@ -62,7 +62,7 @@ def test_get_text_from_rect(test_doc_path):

 def test_crop_page_image(test_doc_path):
    doc_backend = _get_backend(test_doc_path)
-    page_backend: DoclingParseV3PageBackend = doc_backend.load_page(0)
+    page_backend: DoclingParseV4PageBackend = doc_backend.load_page(0)

    # Crop out "Figure 1" from the DocLayNet paper
    im = page_backend.get_page_image(
--- a/tests/test_e2e_conversion.py
+++ b/tests/test_e2e_conversion.py
@@ -1,6 +1,6 @@
 from pathlib import Path

-from docling.backend.docling_parse_v3_backend import DoclingParseV3DocumentBackend
+from docling.backend.docling_parse_v4_backend import DoclingParseV4DocumentBackend
 from docling.datamodel.base_models import InputFormat
 from docling.datamodel.document import ConversionResult
 from docling.datamodel.pipeline_options import AcceleratorDevice, PdfPipelineOptions
@@ -34,7 +34,7 @@ def get_converter():
    converter = DocumentConverter(
        format_options={
            InputFormat.PDF: PdfFormatOption(
-                pipeline_options=pipeline_options, backend=DoclingParseV3DocumentBackend
+                pipeline_options=pipeline_options, backend=DoclingParseV4DocumentBackend
            )
        }
    )
--- a/tests/test_e2e_ocr_conversion.py
+++ b/tests/test_e2e_ocr_conversion.py
@@ -2,7 +2,7 @@ import sys
 from pathlib import Path
 from typing import List

-from docling.backend.docling_parse_v3_backend import DoclingParseV3DocumentBackend
+from docling.backend.docling_parse_v4_backend import DoclingParseV4DocumentBackend
 from docling.datamodel.base_models import InputFormat
 from docling.datamodel.document import ConversionResult
 from docling.datamodel.pipeline_options import (
@@ -45,7 +45,7 @@ def get_converter(ocr_options: OcrOptions):
        format_options={
            InputFormat.PDF: PdfFormatOption(
                pipeline_options=pipeline_options,
-                backend=DoclingParseV3DocumentBackend,
+                backend=DoclingParseV4DocumentBackend,
            )
        }
    )
--- a/tests/test_interfaces.py
+++ b/tests/test_interfaces.py
@@ -3,7 +3,7 @@ from pathlib import Path

 import pytest

-from docling.backend.docling_parse_v3_backend import DoclingParseV3DocumentBackend
+from docling.backend.docling_parse_v4_backend import DoclingParseV4DocumentBackend
 from docling.datamodel.base_models import DocumentStream, InputFormat
 from docling.datamodel.pipeline_options import PdfPipelineOptions
 from docling.document_converter import DocumentConverter, PdfFormatOption
@@ -31,7 +31,7 @@ def converter():
    converter = DocumentConverter(
        format_options={
            InputFormat.PDF: PdfFormatOption(
-                pipeline_options=pipeline_options, backend=DoclingParseV3DocumentBackend
+                pipeline_options=pipeline_options, backend=DoclingParseV4DocumentBackend
            )
        }
    )
--- a/tests/test_options.py
+++ b/tests/test_options.py
@@ -3,7 +3,7 @@ from pathlib import Path

 import pytest

-from docling.backend.docling_parse_v3_backend import DoclingParseV3DocumentBackend
+from docling.backend.docling_parse_v4_backend import DoclingParseV4DocumentBackend
 from docling.datamodel.base_models import ConversionStatus, InputFormat
 from docling.datamodel.document import ConversionResult
 from docling.datamodel.pipeline_options import (
@@ -33,7 +33,7 @@ def get_converters_with_table_options():
                format_options={
                    InputFormat.PDF: PdfFormatOption(
                        pipeline_options=pipeline_options,
-                        backend=DoclingParseV3DocumentBackend,
+                        backend=DoclingParseV4DocumentBackend,
                    )
                }
            )