mirror of
https://github.com/DS4SD/docling.git
synced 2025-08-01 15:02:21 +00:00
show other vlm
Signed-off-by: Michele Dolfi <dol@zurich.ibm.com>
This commit is contained in:
parent
753c12b29e
commit
287e621c7a
@ -175,7 +175,7 @@
|
|||||||
},
|
},
|
||||||
{
|
{
|
||||||
"cell_type": "code",
|
"cell_type": "code",
|
||||||
"execution_count": 5,
|
"execution_count": 7,
|
||||||
"metadata": {},
|
"metadata": {},
|
||||||
"outputs": [],
|
"outputs": [],
|
||||||
"source": [
|
"source": [
|
||||||
@ -265,6 +265,52 @@
|
|||||||
"display.HTML(\"<hr />\".join(html_buffer))"
|
"display.HTML(\"<hr />\".join(html_buffer))"
|
||||||
]
|
]
|
||||||
},
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "markdown",
|
||||||
|
"metadata": {},
|
||||||
|
"source": [
|
||||||
|
"---"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "markdown",
|
||||||
|
"metadata": {},
|
||||||
|
"source": [
|
||||||
|
"## Use other vision models\n",
|
||||||
|
"\n",
|
||||||
|
"The examples above can also be reproduced using other vision models.\n",
|
||||||
|
"The Docling options `PictureDescriptionVlmOptions` allow you to specify your favorite vision model from the Hugging Face Hub."
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": 8,
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": [
|
||||||
|
"from docling.datamodel.pipeline_options import PictureDescriptionVlmOptions\n",
|
||||||
|
"\n",
|
||||||
|
"pipeline_options = PdfPipelineOptions()\n",
|
||||||
|
"pipeline_options.do_picture_description = True\n",
|
||||||
|
"pipeline_options.picture_description_options = PictureDescriptionVlmOptions(\n",
|
||||||
|
" repo_id=\"\", # <-- add here the Hugging Face repo_id of your favorite VLM\n",
|
||||||
|
" prompt=\"Describe the image in three sentences. Be consise and accurate.\",\n",
|
||||||
|
")\n",
|
||||||
|
"pipeline_options.images_scale = 2.0\n",
|
||||||
|
"pipeline_options.generate_picture_images = True\n",
|
||||||
|
"\n",
|
||||||
|
"converter = DocumentConverter(\n",
|
||||||
|
" format_options={\n",
|
||||||
|
" InputFormat.PDF: PdfFormatOption(\n",
|
||||||
|
" pipeline_options=pipeline_options,\n",
|
||||||
|
" )\n",
|
||||||
|
" }\n",
|
||||||
|
")\n",
|
||||||
|
"\n",
|
||||||
|
"# Uncomment to run:\n",
|
||||||
|
"# doc = converter.convert(DOC_SOURCE).document"
|
||||||
|
]
|
||||||
|
},
|
||||||
{
|
{
|
||||||
"cell_type": "code",
|
"cell_type": "code",
|
||||||
"execution_count": null,
|
"execution_count": null,
|
||||||
|
Loading…
Reference in New Issue
Block a user