fix: Enable GPU for RapidOCR when available (#2659)

* add setting for using gpu Signed-off-by: Michele Dolfi <dol@zurich.ibm.com> * add docs Signed-off-by: Michele Dolfi <dol@zurich.ibm.com> --------- Signed-off-by: Michele Dolfi <dol@zurich.ibm.com>
2025-12-08 12:48:28 +00:00 · 2025-11-19 17:12:00 +01:00
parent b216ad848d
commit 463a3fd474
2 changed files with 22 additions and 0 deletions
--- a/docling/models/rapid_ocr_model.py
+++ b/docling/models/rapid_ocr_model.py
@@ -110,6 +110,9 @@ class RapidOcrModel(BaseOcrModel):
            use_cuda = str(AcceleratorDevice.CUDA.value).lower() in device
            use_dml = accelerator_options.device == AcceleratorDevice.AUTO
            intra_op_num_threads = accelerator_options.num_threads
            gpu_id = 0
            if use_cuda and ":" in device:
                gpu_id = int(device.split(":")[1])
            _ALIASES = {
                "onnxruntime": EngineType.ONNXRUNTIME,
                "openvino": EngineType.OPENVINO,
@@ -184,6 +187,10 @@ class RapidOcrModel(BaseOcrModel):
                "Det.engine_type": backend_enum,
                "Cls.engine_type": backend_enum,
                "Rec.engine_type": backend_enum,
                "EngineConfig.paddle.use_cuda": use_cuda,
                "EngineConfig.paddle.gpu_id": gpu_id,
                "EngineConfig.torch.use_cuda": use_cuda,
                "EngineConfig.torch.gpu_id": gpu_id,
            }
            if self.options.rec_font_path is not None:
--- a/docs/usage/gpu.md
+++ b/docs/usage/gpu.md
@@ -43,6 +43,21 @@ Setting a higher `page_batch_size` will run the Docling models (in particular th
 For a complete example see [gpu_standard_pipeline.py](../examples/gpu_standard_pipeline.py).
 #### OCR engines
 The current Docling OCR engines rely on third-party libraries, hence GPU support depends on its availability in the respective engines.
 The only setup known to work at the moment is RapidOCR with the torch backend, which can be enabled as follows:
 ```py
 pipeline_options = PdfPipelineOptions()
 pipeline_options.ocr_options = RapidOcrOptions(
    backend="torch",
 )
 ```
 More details are available in the GitHub discussion [#2451](https://github.com/docling-project/docling/discussions/2451).
 ### VLM Pipeline