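Update the GraniteDocling model specs: the Transformers variant now lists CPU and CUDA as supported devices, and both variants set max_new_tokens=8192 and stop on "<|end_of_text|>" instead of "<end_of_utterance>"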

Signed-off-by: Peter Staar <taa@zurich.ibm.com>
This commit is contained in:
Peter Staar
2025-09-05 16:58:43 +02:00
parent c1dcb0597d
commit 0e2f370f4f

View File

@@ -24,10 +24,14 @@ GRANITEDOCLING_TRANSFORMERS = InlineVlmOptions(
prompt="Convert this page to docling.", prompt="Convert this page to docling.",
response_format=ResponseFormat.DOCTAGS, response_format=ResponseFormat.DOCTAGS,
inference_framework=InferenceFramework.MLX, inference_framework=InferenceFramework.MLX,
supported_devices=[AcceleratorDevice.MPS], supported_devices=[
AcceleratorDevice.CPU,
AcceleratorDevice.CUDA,
],
scale=2.0, scale=2.0,
temperature=0.0, temperature=0.0,
stop_strings=["</doctag>", "<end_of_utterance>"], max_new_tokens=8192,
stop_strings=["</doctag>", "<|end_of_text|>"],
) )
GRANITEDOCLING_MLX = InlineVlmOptions( GRANITEDOCLING_MLX = InlineVlmOptions(
@@ -38,7 +42,8 @@ GRANITEDOCLING_MLX = InlineVlmOptions(
supported_devices=[AcceleratorDevice.MPS], supported_devices=[AcceleratorDevice.MPS],
scale=2.0, scale=2.0,
temperature=0.0, temperature=0.0,
stop_strings=["</doctag>", "<end_of_utterance>"], max_new_tokens=8192,
stop_strings=["</doctag>", "<|end_of_text|>"],
) )
# SmolDocling # SmolDocling