feat: Introduce the --force-ocr command-line option in the docling CLI. Add the full_page_ocr.py example to the mkdocs navigation

Signed-off-by: Nikos Livathinos <nli@zurich.ibm.com>
2025-07-30 22:14:37 +00:00 · 2024-11-11 14:10:56 +01:00 · 2024-11-11 14:10:56 +01:00 · 7234dc3a42
commit 7234dc3a42
parent 1963e7145b
3 changed files with 11 additions and 4 deletions
--- a/docling/cli/main.py
+++ b/docling/cli/main.py
@@ -153,6 +153,13 @@ def convert(
            ..., help="If enabled, the bitmap content will be processed using OCR."
        ),
    ] = True,
+    force_ocr: Annotated[
+        bool,
+        typer.Option(
+            ...,
+            help="Replace any existing text with OCR generated text over the full content.",
+        ),
+    ] = False,
    ocr_engine: Annotated[
        OcrEngine, typer.Option(..., help="The OCR engine to use.")
    ] = OcrEngine.EASYOCR,
@@ -219,11 +226,11 @@ def convert(

    match ocr_engine:
        case OcrEngine.EASYOCR:
-            ocr_options: OcrOptions = EasyOcrOptions()
+            ocr_options: OcrOptions = EasyOcrOptions(force_full_page_ocr=force_ocr)
        case OcrEngine.TESSERACT_CLI:
-            ocr_options = TesseractCliOcrOptions()
+            ocr_options = TesseractCliOcrOptions(force_full_page_ocr=force_ocr)
        case OcrEngine.TESSERACT:
-            ocr_options = TesseractOcrOptions()
+            ocr_options = TesseractOcrOptions(force_full_page_ocr=force_ocr)
        case _:
            raise RuntimeError(f"Unexpected OCR engine type {ocr_engine}")

--- a/docs/examples/full_page_ocr.py
+++ b/docs/examples/full_page_ocr.py
@@ -29,7 +29,6 @@ def main():
        format_options={
            InputFormat.PDF: PdfFormatOption(
                pipeline_options=pipeline_options,
-                backend=DoclingParseDocumentBackend,
            )
        }
    )
--- a/mkdocs.yml
+++ b/mkdocs.yml
@@ -69,6 +69,7 @@ nav:
      - "Figure enrichment": examples/develop_picture_enrichment.py
      - "Table export": examples/export_tables.py
      - "Multimodal export": examples/export_multimodal.py
+      - "Force full page OCR": examples/full_page_ocr.py
    - RAG / QA:
      - "RAG with LlamaIndex 🦙": examples/rag_llamaindex.ipynb
      - "RAG with LangChain 🦜🔗": examples/rag_langchain.ipynb