diff --git a/docling/models/vlm_models_inline/hf_transformers_model.py b/docling/models/vlm_models_inline/hf_transformers_model.py index 18bd7d86..689bdc50 100644 --- a/docling/models/vlm_models_inline/hf_transformers_model.py +++ b/docling/models/vlm_models_inline/hf_transformers_model.py @@ -94,7 +94,7 @@ class HuggingFaceTransformersVlmModel(BasePageModel, HuggingFaceModelDownloadMix model_cls = AutoModelForVision2Seq elif ( self.vlm_options.transformers_model_type - == TransformersModelType.AUTOMODEL_FORIMAGETEXTTOTEXT + == TransformersModelType.AUTOMODEL_IMAGETEXTTOTEXT ): model_cls = AutoModelForImageTextToText