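Small fixes

- vlm_model_specs: set SMOLVLM500_TRANSFORMERS response_format to
  ResponseFormat.PLAINTEXT (was ResponseFormat.DOCTAGS)
- threaded_multistage_vlm_pipeline: use SMOLVLM500_MLX as base_model
  (was SMOLVLM500_TRANSFORMERS)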

Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
2025-12-08 12:48:28 +00:00 · 2025-08-18 11:12:02 +02:00
parent f42676aab9
commit e372cfe01a
2 changed files with 2 additions and 2 deletions
--- a/docling/datamodel/vlm_model_specs.py
+++ b/docling/datamodel/vlm_model_specs.py
@@ -65,7 +65,7 @@ SMOLDOCLING_VLLM = InlineVlmOptions(
 SMOLVLM500_TRANSFORMERS = InlineVlmOptions(
    repo_id="HuggingFaceTB/SmolVLM-500M-Instruct",
    prompt="Transcribe this image to plain text.",
-    response_format=ResponseFormat.DOCTAGS,
+    response_format=ResponseFormat.PLAINTEXT,
    inference_framework=InferenceFramework.TRANSFORMERS,
    transformers_model_type=TransformersModelType.AUTOMODEL_IMAGETEXTTOTEXT,
    supported_devices=[
--- a/docling/pipeline/threaded_multistage_vlm_pipeline.py
+++ b/docling/pipeline/threaded_multistage_vlm_pipeline.py
@@ -161,7 +161,7 @@ class ThreadedMultiStageVlmPipelineOptions(PaginatedPipelineOptions):
        # text_opts = DOLPHIN_TRANSFORMERS.model_copy()
        # text_opts.prompt = "<s>Read text in the image. <Answer/>"

-        base_model = SMOLVLM500_TRANSFORMERS
+        base_model = SMOLVLM500_MLX

        text_opts = base_model.model_copy()
        # text_opts.prompt = "Convert this page to docling."