diff --git a/docling/datamodel/vlm_model_specs.py b/docling/datamodel/vlm_model_specs.py
index fd3c347d..dd796fba 100644
--- a/docling/datamodel/vlm_model_specs.py
+++ b/docling/datamodel/vlm_model_specs.py
@@ -24,10 +24,14 @@ GRANITEDOCLING_TRANSFORMERS = InlineVlmOptions(
     prompt="Convert this page to docling.",
     response_format=ResponseFormat.DOCTAGS,
     inference_framework=InferenceFramework.MLX,
-    supported_devices=[AcceleratorDevice.MPS],
+    supported_devices=[
+        AcceleratorDevice.CPU,
+        AcceleratorDevice.CUDA,
+    ],
     scale=2.0,
     temperature=0.0,
-    stop_strings=["", ""],
+    max_new_tokens=8192,
+    stop_strings=["", "<|end_of_text|>"],
 )
 
 GRANITEDOCLING_MLX = InlineVlmOptions(
@@ -38,7 +42,8 @@ GRANITEDOCLING_MLX = InlineVlmOptions(
     supported_devices=[AcceleratorDevice.MPS],
     scale=2.0,
     temperature=0.0,
-    stop_strings=["", ""],
+    max_new_tokens=8192,
+    stop_strings=["", "<|end_of_text|>"],
 )
 
 # SmolDocling