updated the model specs

Signed-off-by: Peter Staar <taa@zurich.ibm.com>
2025-12-08 12:48:28 +00:00 · 2025-09-05 16:58:43 +02:00
parent c1dcb0597d
commit 0e2f370f4f
1 changed files with 8 additions and 3 deletions
--- a/docling/datamodel/vlm_model_specs.py
+++ b/docling/datamodel/vlm_model_specs.py
@@ -24,10 +24,14 @@ GRANITEDOCLING_TRANSFORMERS = InlineVlmOptions(
    prompt="Convert this page to docling.",
    response_format=ResponseFormat.DOCTAGS,
    inference_framework=InferenceFramework.MLX,
-    supported_devices=[AcceleratorDevice.MPS],
+    supported_devices=[
+        AcceleratorDevice.CPU,
+        AcceleratorDevice.CUDA,
+    ],
    scale=2.0,
    temperature=0.0,
-    stop_strings=["</doctag>", "<end_of_utterance>"],
+    max_new_tokens=8192,
+    stop_strings=["</doctag>", "<|end_of_text|>"],
 )
 GRANITEDOCLING_MLX = InlineVlmOptions(
@@ -38,7 +42,8 @@ GRANITEDOCLING_MLX = InlineVlmOptions(
    supported_devices=[AcceleratorDevice.MPS],
    scale=2.0,
    temperature=0.0,
-    stop_strings=["</doctag>", "<end_of_utterance>"],
+    max_new_tokens=8192,
+    stop_strings=["</doctag>", "<|end_of_text|>"],
 )
 # SmolDocling