diff --git a/docling/datamodel/vlm_model_specs.py b/docling/datamodel/vlm_model_specs.py index 54d0c3e9..d008f58c 100644 --- a/docling/datamodel/vlm_model_specs.py +++ b/docling/datamodel/vlm_model_specs.py @@ -287,6 +287,7 @@ DOLPHIN_TRANSFORMERS = InlineVlmOptions( # NuExtract NU_EXTRACT_2B_TRANSFORMERS = InlineVlmOptions( repo_id="numind/NuExtract-2.0-2B", + revision="fe5b2f0b63b81150721435a3ca1129a75c59c74e", # 489efed leads to MPS issues prompt="", # This won't be used, template is passed separately torch_dtype="bfloat16", inference_framework=InferenceFramework.TRANSFORMERS, diff --git a/docling/models/vlm_models_inline/nuextract_transformers_model.py b/docling/models/vlm_models_inline/nuextract_transformers_model.py index 194a1d9d..3fe39510 100644 --- a/docling/models/vlm_models_inline/nuextract_transformers_model.py +++ b/docling/models/vlm_models_inline/nuextract_transformers_model.py @@ -131,7 +131,10 @@ class NuExtractTransformersModel(BaseVlmModel, HuggingFaceModelDownloadMixin): repo_cache_folder = vlm_options.repo_id.replace("/", "--") if artifacts_path is None: - artifacts_path = self.download_models(self.vlm_options.repo_id) + artifacts_path = self.download_models( + repo_id=self.vlm_options.repo_id, + revision=self.vlm_options.revision, + ) elif (artifacts_path / repo_cache_folder).exists(): artifacts_path = artifacts_path / repo_cache_folder