diff --git a/docling/datamodel/pipeline_model_specializations.py b/docling/datamodel/pipeline_model_specializations.py index 12ebcb46..7082da3b 100644 --- a/docling/datamodel/pipeline_model_specializations.py +++ b/docling/datamodel/pipeline_model_specializations.py @@ -154,3 +154,22 @@ qwen25_vl_3b_vlm_mlx_conversion_options = HuggingFaceVlmOptions( scale=2.0, temperature=0.0, ) + +# Gemma-3 +gemma_3_12b_mlx_conversion_options = HuggingFaceVlmOptions( + repo_id="mlx-community/gemma-3-12b-it-bf16", + prompt="Convert this page to markdown. Do not miss any text and only output the bare MarkDown!", + response_format=ResponseFormat.MARKDOWN, + inference_framework=InferenceFramework.MLX, + scale=2.0, + temperature=0.0, +) + +gemma_3_27b_mlx_conversion_options = HuggingFaceVlmOptions( + repo_id="mlx-community/gemma-3-27b-it-bf16", + prompt="Convert this page to markdown. Do not miss any text and only output the bare MarkDown!", + response_format=ResponseFormat.MARKDOWN, + inference_framework=InferenceFramework.MLX, + scale=2.0, + temperature=0.0, +) diff --git a/docs/examples/minimal_vlm_pipeline.py b/docs/examples/minimal_vlm_pipeline.py index fa79fcc9..32aecc6d 100644 --- a/docs/examples/minimal_vlm_pipeline.py +++ b/docs/examples/minimal_vlm_pipeline.py @@ -11,6 +11,7 @@ from docling.datamodel.pipeline_model_specializations import ( HuggingFaceVlmOptions, InferenceFramework, ResponseFormat, + gemma_3_12b_mlx_conversion_options, granite_vision_vlm_conversion_options, granite_vision_vlm_ollama_conversion_options, phi_vlm_conversion_options, @@ -199,6 +200,7 @@ if __name__ == "__main__": # qwen25_vl_3b_vlm_mlx_conversion_options, \ # pixtral_12b_vlm_mlx_conversion_options, # pixtral_12b_vlm_conversion_options, + gemma_3_12b_mlx_conversion_options, ]: pipeline_options.vlm_options = vlm_options diff --git a/tests/test_backend_html.py b/tests/test_backend_html.py index 18254a78..783137cc 100644 --- a/tests/test_backend_html.py +++ b/tests/test_backend_html.py @@ -2,6 +2,7 @@ from io import BytesIO from pathlib import Path import pytest +from docling_core.types.doc.document import SectionHeaderItem from docling.backend.html_backend import HTMLDocumentBackend from docling.datamodel.base_models import InputFormat @@ -9,7 +10,7 @@ from docling.datamodel.document import ( ConversionResult, DoclingDocument, InputDocument, - SectionHeaderItem, + # SectionHeaderItem, ) from docling.document_converter import DocumentConverter diff --git a/tests/test_backend_msword.py b/tests/test_backend_msword.py index c50e0718..782e04ee 100644 --- a/tests/test_backend_msword.py +++ b/tests/test_backend_msword.py @@ -1,12 +1,14 @@ from pathlib import Path +from docling_core.types.doc.document import SectionHeaderItem + from docling.backend.msword_backend import MsWordDocumentBackend from docling.datamodel.base_models import InputFormat from docling.datamodel.document import ( ConversionResult, DoclingDocument, InputDocument, - SectionHeaderItem, + # SectionHeaderItem, ) from docling.document_converter import DocumentConverter