From bba056b2da043c02d3253acdb4f875dbe7ccf421 Mon Sep 17 00:00:00 2001 From: DimtrisKaragatslis Date: Thu, 8 May 2025 15:12:22 +0300 Subject: [PATCH] fix: ensure orig and text are both strings in TesseractOcrCliModel Signed-off-by: Dimitris Karagatslis --- docling/models/tesseract_ocr_cli_model.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docling/models/tesseract_ocr_cli_model.py b/docling/models/tesseract_ocr_cli_model.py index 91b4555f..33ca0c10 100644 --- a/docling/models/tesseract_ocr_cli_model.py +++ b/docling/models/tesseract_ocr_cli_model.py @@ -249,7 +249,7 @@ class TesseractOcrCliModel(BaseOcrModel): cell = TextCell( index=ix, text=str(text), - orig=text, + orig=str(text), from_ocr=True, confidence=conf / 100.0, rect=BoundingRectangle.from_bounding_box(