mirror of
https://github.com/DS4SD/docling.git
synced 2025-07-25 19:44:34 +00:00
initial reference to granite-docling
Signed-off-by: Peter Staar <taa@zurich.ibm.com>
This commit is contained in:
parent
64ac043786
commit
90da15f611
@ -50,6 +50,7 @@ from docling.datamodel.settings import settings
|
|||||||
from docling.datamodel.vlm_model_specs import (
|
from docling.datamodel.vlm_model_specs import (
|
||||||
GRANITE_VISION_OLLAMA,
|
GRANITE_VISION_OLLAMA,
|
||||||
GRANITE_VISION_TRANSFORMERS,
|
GRANITE_VISION_TRANSFORMERS,
|
||||||
|
GRANITEDOCLING_TRANSFORMERS,
|
||||||
SMOLDOCLING_MLX,
|
SMOLDOCLING_MLX,
|
||||||
SMOLDOCLING_TRANSFORMERS,
|
SMOLDOCLING_TRANSFORMERS,
|
||||||
VlmModelType,
|
VlmModelType,
|
||||||
@ -595,6 +596,20 @@ def convert( # noqa: C901
|
|||||||
"To run SmolDocling faster, please install mlx-vlm:\n"
|
"To run SmolDocling faster, please install mlx-vlm:\n"
|
||||||
"pip install mlx-vlm"
|
"pip install mlx-vlm"
|
||||||
)
|
)
|
||||||
|
elif vlm_model == VlmModelType.GRANITE_DOCLING:
|
||||||
|
pipeline_options.vlm_options = GRANITEDOCLING_TRANSFORMERS
|
||||||
|
"""
|
||||||
|
if sys.platform == "darwin":
|
||||||
|
try:
|
||||||
|
import mlx_vlm
|
||||||
|
|
||||||
|
pipeline_options.vlm_options = GRANITEDOCLING_MLX
|
||||||
|
except ImportError:
|
||||||
|
_log.warning(
|
||||||
|
"To run SmolDocling faster, please install mlx-vlm:\n"
|
||||||
|
"pip install mlx-vlm"
|
||||||
|
)
|
||||||
|
"""
|
||||||
|
|
||||||
pdf_format_option = PdfFormatOption(
|
pdf_format_option = PdfFormatOption(
|
||||||
pipeline_cls=VlmPipeline, pipeline_options=pipeline_options
|
pipeline_cls=VlmPipeline, pipeline_options=pipeline_options
|
||||||
|
@ -43,6 +43,22 @@ SMOLDOCLING_TRANSFORMERS = InlineVlmOptions(
|
|||||||
temperature=0.0,
|
temperature=0.0,
|
||||||
)
|
)
|
||||||
|
|
||||||
|
# GraniteDocling
|
||||||
|
GRANITEDOCLING_TRANSFORMERS = InlineVlmOptions(
|
||||||
|
repo_id="ibm-granite/granite-docling-256m-preview",
|
||||||
|
prompt="Convert this page to docling.",
|
||||||
|
response_format=ResponseFormat.DOCTAGS,
|
||||||
|
inference_framework=InferenceFramework.TRANSFORMERS,
|
||||||
|
transformers_model_type=TransformersModelType.AUTOMODEL_VISION2SEQ,
|
||||||
|
supported_devices=[
|
||||||
|
AcceleratorDevice.CPU,
|
||||||
|
AcceleratorDevice.CUDA,
|
||||||
|
AcceleratorDevice.MPS,
|
||||||
|
],
|
||||||
|
scale=2.0,
|
||||||
|
temperature=0.0,
|
||||||
|
)
|
||||||
|
|
||||||
# GraniteVision
|
# GraniteVision
|
||||||
GRANITE_VISION_TRANSFORMERS = InlineVlmOptions(
|
GRANITE_VISION_TRANSFORMERS = InlineVlmOptions(
|
||||||
repo_id="ibm-granite/granite-vision-3.2-2b",
|
repo_id="ibm-granite/granite-vision-3.2-2b",
|
||||||
@ -140,5 +156,6 @@ GEMMA3_27B_MLX = InlineVlmOptions(
|
|||||||
|
|
||||||
class VlmModelType(str, Enum):
|
class VlmModelType(str, Enum):
|
||||||
SMOLDOCLING = "smoldocling"
|
SMOLDOCLING = "smoldocling"
|
||||||
|
GRANITE_DOCLING = "granite_docling"
|
||||||
GRANITE_VISION = "granite_vision"
|
GRANITE_VISION = "granite_vision"
|
||||||
GRANITE_VISION_OLLAMA = "granite_vision_ollama"
|
GRANITE_VISION_OLLAMA = "granite_vision_ollama"
|
||||||
|
Loading…
Reference in New Issue
Block a user