From a0aa83301c617c4d47481e092e4595fd20c6da1e Mon Sep 17 00:00:00 2001
From: Simonas <20096648+simjak@users.noreply.github.com>
Date: Tue, 3 Dec 2024 09:30:03 +0200
Subject: [PATCH] chore: base ocr options, was missing rapid ocr

Signed-off-by: Simonas <20096648+simjak@users.noreply.github.com>
---
 docling/datamodel/pipeline_options.py | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/docling/datamodel/pipeline_options.py b/docling/datamodel/pipeline_options.py
index 63e0d3c6..5e73a905 100644
--- a/docling/datamodel/pipeline_options.py
+++ b/docling/datamodel/pipeline_options.py
@@ -142,9 +142,7 @@ class PdfPipelineOptions(PipelineOptions):
     do_ocr: bool = True  # True: perform OCR, replace programmatic PDF text
 
     table_structure_options: TableStructureOptions = TableStructureOptions()
-    ocr_options: Union[
-        EasyOcrOptions, TesseractCliOcrOptions, TesseractOcrOptions, OcrMacOptions
-    ] = Field(EasyOcrOptions(), discriminator="kind")
+    ocr_options: OcrOptions = Field(EasyOcrOptions(), discriminator="kind")
 
     images_scale: float = 1.0
     generate_page_images: bool = False