From ea3f720ef59561419797741699099a642ae8f361 Mon Sep 17 00:00:00 2001
From: Michele Dolfi
Date: Tue, 8 Oct 2024 11:32:54 +0200
Subject: [PATCH] remove pydantic warning for model_

Signed-off-by: Michele Dolfi
---
Review notes (commentary only: text between the "---" marker and the first
"diff --git" line is not part of the applied change):

* Hunk 1 adds ConfigDict to the existing pydantic import.
* Hunk 2 adds a `model_config = ConfigDict(...)` class attribute to
  EasyOcrOptions, TesseractOcrOptions and TesserOcrOptions.
* Only EasyOcrOptions sets `protected_namespaces=()`. It is the only class
  in these hunks with a field whose name starts with "model_"
  (`model_storage_directory`), which is presumably the field that triggered
  the warning named in the subject line -- confirm against pydantic's
  protected-namespace rules.
* NOTE(review): all three classes also gain `extra="forbid"`, which the
  subject line does not mention. Confirm that rejecting unknown fields on
  these option models is intended and not a side effect of this change.

 docling/datamodel/pipeline_options.py | 15 ++++++++++++++-
 1 file changed, 14 insertions(+), 1 deletion(-)

diff --git a/docling/datamodel/pipeline_options.py b/docling/datamodel/pipeline_options.py
index 0c915bbf..b4bb9977 100644
--- a/docling/datamodel/pipeline_options.py
+++ b/docling/datamodel/pipeline_options.py
@@ -1,7 +1,7 @@
 from enum import Enum, auto
 from typing import List, Literal, Optional, Union
 
-from pydantic import BaseModel, Field
+from pydantic import BaseModel, ConfigDict, Field
 
 
 class TableFormerMode(str, Enum):
@@ -30,17 +30,30 @@ class EasyOcrOptions(OcrOptions):
     model_storage_directory: Optional[str] = None
     download_enabled: bool = True  # same default as easyocr.Reader
 
+    model_config = ConfigDict(
+        extra="forbid",
+        protected_namespaces=(),
+    )
+
 
 class TesseractOcrOptions(OcrOptions):
     kind: Literal["tesseract"] = "tesseract"
     lang: List[str] = ["fra", "deu", "spa", "eng"]
     tesseract_cmd: str = "tesseract"
 
+    model_config = ConfigDict(
+        extra="forbid",
+    )
+
 
 class TesserOcrOptions(OcrOptions):
     kind: Literal["tesserocr"] = "tesserocr"
     lang: List[str] = ["fra", "deu", "spa", "eng"]
 
+    model_config = ConfigDict(
+        extra="forbid",
+    )
+
 
 class PipelineOptions(BaseModel):
     do_table_structure: bool = True  # True: perform table structure extraction