mirror of
https://github.com/DS4SD/docling.git
synced 2025-12-11 22:28:31 +00:00
20479 lines
714 KiB
HTML
20479 lines
714 KiB
HTML
|
||
<!doctype html>
<html lang="en" class="no-js">
<!--
  Document head for the "Pipeline options" reference page.
  Only metadata elements may appear between the head tags: any stray text
  here makes the parser leave the head early and treat the remaining
  link, style and script elements as body content.
-->
<head>
  <!-- Encoding and viewport declarations. -->
  <meta charset="utf-8">
  <meta name="viewport" content="width=device-width,initial-scale=1">

  <!-- Canonical URL and the previous / next pages in the reading order. -->
  <link rel="canonical" href="https://docling-project.github.io/docling/reference/pipeline_options/">
  <link rel="prev" href="../document_converter/">
  <link rel="next" href="../docling_document/">

  <link rel="icon" href="../../assets/logo.png">
  <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.7.0">

  <title>Pipeline options - Docling</title>

  <!-- Theme stylesheets. -->
  <link rel="stylesheet" href="../../assets/stylesheets/main.618322db.min.css">
  <link rel="stylesheet" href="../../assets/stylesheets/palette.ab4e12ef.min.css">

  <!-- Web fonts; the ampersand in the query string is written as a character reference. -->
  <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
  <link rel="stylesheet" href="https://fonts.googleapis.com/css?family=Roboto:300,300i,400,400i,700,700i%7CRoboto+Mono:400,400i,700,700i&amp;display=fallback">
  <style>:root{--md-text-font:"Roboto";--md-code-font:"Roboto Mono"}</style>

  <!-- Additional stylesheets loaded after the theme. -->
  <link rel="stylesheet" href="../../assets/_mkdocstrings.css">
  <link rel="stylesheet" href="../../stylesheets/extra.css">

  <!--
    Storage helpers. __md_scope is the URL two levels above this page;
    __md_get and __md_set read and write JSON values in a storage object
    (localStorage unless another is passed) under the key
    "<scope pathname>.<name>". __md_set ignores storage errors.
    __md_hash folds the character codes of a string into a number.
  -->
  <script>__md_scope=new URL("../..",location),__md_hash=e=>[...e].reduce(((e,_)=>(e<<5)-e+_.charCodeAt(0)),0),__md_get=(e,_=localStorage,t=__md_scope)=>JSON.parse(_.getItem(t.pathname+"."+e)),__md_set=(e,_,t=localStorage,a=__md_scope)=>{try{t.setItem(a.pathname+"."+e,JSON.stringify(_))}catch(e){}}</script>

  <!--
    Defines __md_analytics. When called it pushes the G-MP75NXFDH4
    configuration to window.dataLayer, registers listeners that report
    search terms and feedback clicks, and inserts the googletagmanager
    loader script directly after this element (looked up by its id).
  -->
  <script id="__analytics">function __md_analytics(){function e(){dataLayer.push(arguments)}window.dataLayer=window.dataLayer||[],e("js",new Date),e("config","G-MP75NXFDH4"),document.addEventListener("DOMContentLoaded",(function(){document.forms.search&&document.forms.search.query.addEventListener("blur",(function(){this.value&&e("event","search",{search_term:this.value})}));document$.subscribe((function(){var t=document.forms.feedback;if(void 0!==t)for(var a of t.querySelectorAll("[type=submit]"))a.addEventListener("click",(function(a){a.preventDefault();var n=document.location.pathname,d=this.getAttribute("data-md-value");e("event","feedback",{page:n,data:d}),t.firstElementChild.disabled=!0;var r=t.querySelector(".md-feedback__note [data-md-value='"+d+"']");r&&(r.hidden=!1)})),t.hidden=!1})),location$.subscribe((function(t){e("config","G-MP75NXFDH4",{page_path:t.pathname})}))}));var t=document.createElement("script");t.async=!0,t.src="https://www.googletagmanager.com/gtag/js?id=G-MP75NXFDH4",document.getElementById("__analytics").insertAdjacentElement("afterEnd",t)}</script>

  <!-- Runs the analytics setup only when the function above is defined. -->
  <script>"undefined"!=typeof __md_analytics&&__md_analytics()</script>
</head>
<body dir="ltr" data-md-color-scheme="slate" data-md-color-primary="black" data-md-color-accent="indigo">
<!--
  State checkboxes for the drawer and the search panel. Labels elsewhere in
  the page target them through for="__drawer" and for="__search".
-->
<input class="md-toggle" data-md-toggle="drawer" type="checkbox" id="__drawer" autocomplete="off">
<input class="md-toggle" data-md-toggle="search" type="checkbox" id="__search" autocomplete="off">

<!-- Overlay label: activating it toggles the drawer checkbox. -->
<label class="md-overlay" for="__drawer"></label>

<!-- Skip link that jumps to the element with id "pipeline-options". -->
<div data-md-component="skip">
  <a href="#pipeline-options" class="md-skip">
    Skip to content
  </a>
</div>

<!-- Announcement slot; it has no content on this page. -->
<div data-md-component="announce">
</div>
|
||
|
||
|
||
|
||
|
||
<!--
  Page header: logo link, drawer toggle, title, colour palette switcher,
  search dialog and repository link. Stray text between the elements was
  removed; every element, attribute and script is otherwise unchanged.
-->
<header class="md-header" data-md-component="header">
  <nav class="md-header__inner md-grid" aria-label="Header">

    <!-- Logo linking to the site root. -->
    <a href="../.." title="Docling" class="md-header__button md-logo" aria-label="Docling" data-md-component="logo">
      <img src="../../assets/logo.png" alt="logo">
    </a>

    <!-- Menu icon; the label toggles the #__drawer checkbox. -->
    <label class="md-header__button md-icon" for="__drawer">
      <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M3 6h18v2H3zm0 5h18v2H3zm0 5h18v2H3z"/></svg>
    </label>

    <!-- Site name and current page title. -->
    <div class="md-header__title" data-md-component="header-title">
      <div class="md-header__ellipsis">
        <div class="md-header__topic">
          <span class="md-ellipsis">
            Docling
          </span>
        </div>
        <div class="md-header__topic" data-md-component="header-topic">
          <span class="md-ellipsis">
            Pipeline options
          </span>
        </div>
      </div>
    </div>

    <!--
      Palette switcher: three radio inputs, each followed by a label that
      targets the next input in the cycle (0 to 1, 1 to 2, 2 to 0).
    -->
    <form class="md-header__option" data-md-component="palette">
      <input class="md-option" data-md-color-media="" data-md-color-scheme="slate" data-md-color-primary="black" data-md-color-accent="indigo" aria-label="Switch to light mode" type="radio" name="__palette" id="__palette_0">
      <label class="md-header__button md-icon" title="Switch to light mode" for="__palette_1" hidden>
        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M12 8a4 4 0 0 0-4 4 4 4 0 0 0 4 4 4 4 0 0 0 4-4 4 4 0 0 0-4-4m0 10a6 6 0 0 1-6-6 6 6 0 0 1 6-6 6 6 0 0 1 6 6 6 6 0 0 1-6 6m8-9.31V4h-4.69L12 .69 8.69 4H4v4.69L.69 12 4 15.31V20h4.69L12 23.31 15.31 20H20v-4.69L23.31 12z"/></svg>
      </label>

      <input class="md-option" data-md-color-media="(prefers-color-scheme: light)" data-md-color-scheme="default" data-md-color-primary="black" data-md-color-accent="indigo" aria-label="Switch to dark mode" type="radio" name="__palette" id="__palette_1">
      <label class="md-header__button md-icon" title="Switch to dark mode" for="__palette_2" hidden>
        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M12 18c-.89 0-1.74-.2-2.5-.55C11.56 16.5 13 14.42 13 12s-1.44-4.5-3.5-5.45C10.26 6.2 11.11 6 12 6a6 6 0 0 1 6 6 6 6 0 0 1-6 6m8-9.31V4h-4.69L12 .69 8.69 4H4v4.69L.69 12 4 15.31V20h4.69L12 23.31 15.31 20H20v-4.69L23.31 12z"/></svg>
      </label>

      <input class="md-option" data-md-color-media="(prefers-color-scheme: dark)" data-md-color-scheme="slate" data-md-color-primary="black" data-md-color-accent="indigo" aria-label="Switch to system preference" type="radio" name="__palette" id="__palette_2">
      <label class="md-header__button md-icon" title="Switch to system preference" for="__palette_0" hidden>
        <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="m14.3 16-.7-2h-3.2l-.7 2H7.8L11 7h2l3.2 9zM20 8.69V4h-4.69L12 .69 8.69 4H4v4.69L.69 12 4 15.31V20h4.69L12 23.31 15.31 20H20v-4.69L23.31 12zm-9.15 3.96h2.3L12 9z"/></svg>
      </label>
    </form>

    <!--
      Restores the stored palette: reads "__palette" through __md_get and
      copies each stored colour entry onto the body as a data-md-color-*
      attribute. When the stored media value is "(prefers-color-scheme)",
      the entries are first taken from the input matching the current
      light or dark media query.
    -->
    <script>var palette=__md_get("__palette");if(palette&&palette.color){if("(prefers-color-scheme)"===palette.color.media){var media=matchMedia("(prefers-color-scheme: light)"),input=document.querySelector(media.matches?"[data-md-color-media='(prefers-color-scheme: light)']":"[data-md-color-media='(prefers-color-scheme: dark)']");palette.color.media=input.getAttribute("data-md-color-media"),palette.color.scheme=input.getAttribute("data-md-color-scheme"),palette.color.primary=input.getAttribute("data-md-color-primary"),palette.color.accent=input.getAttribute("data-md-color-accent")}for(var[key,value]of Object.entries(palette.color))document.body.setAttribute("data-md-color-"+key,value)}</script>

    <!-- Search icon; the label toggles the #__search checkbox. -->
    <label class="md-header__button md-icon" for="__search">
      <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.52 6.52 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5"/></svg>
    </label>

    <!-- Search dialog: query form plus the result list container. -->
    <div class="md-search" data-md-component="search" role="dialog">
      <label class="md-search__overlay" for="__search"></label>
      <div class="md-search__inner" role="search">
        <form class="md-search__form" name="search">
          <input type="text" class="md-search__input" name="query" aria-label="Search" placeholder="Search" autocapitalize="off" autocorrect="off" autocomplete="off" spellcheck="false" data-md-component="search-query" required>
          <label class="md-search__icon md-icon" for="__search">
            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M9.5 3A6.5 6.5 0 0 1 16 9.5c0 1.61-.59 3.09-1.56 4.23l.27.27h.79l5 5-1.5 1.5-5-5v-.79l-.27-.27A6.52 6.52 0 0 1 9.5 16 6.5 6.5 0 0 1 3 9.5 6.5 6.5 0 0 1 9.5 3m0 2C7 5 5 7 5 9.5S7 14 9.5 14 14 12 14 9.5 12 5 9.5 5"/></svg>
            <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M20 11v2H8l5.5 5.5-1.42 1.42L4.16 12l7.92-7.92L13.5 5.5 8 11z"/></svg>
          </label>
          <nav class="md-search__options" aria-label="Search">
            <button type="reset" class="md-search__icon md-icon" title="Clear" aria-label="Clear" tabindex="-1">
              <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M19 6.41 17.59 5 12 10.59 6.41 5 5 6.41 10.59 12 5 17.59 6.41 19 12 13.41 17.59 19 19 17.59 13.41 12z"/></svg>
            </button>
          </nav>
          <div class="md-search__suggest" data-md-component="search-suggest"></div>
        </form>
        <div class="md-search__output">
          <div class="md-search__scrollwrap" tabindex="0" data-md-scrollfix>
            <div class="md-search-result" data-md-component="search-result">
              <div class="md-search-result__meta">
                Initializing search
              </div>
              <ol class="md-search-result__list" role="presentation"></ol>
            </div>
          </div>
        </div>
      </div>
    </div>

    <!-- Link to the source repository. -->
    <div class="md-header__source">
      <a href="https://github.com/docling-project/docling" title="Go to repository" class="md-source" data-md-component="source">
        <div class="md-source__icon md-icon">
          <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 448 512"><!--! Font Awesome Free 7.1.0 by @fontawesome - https://fontawesome.com License - https://fontawesome.com/license/free (Icons: CC BY 4.0, Fonts: SIL OFL 1.1, Code: MIT License) Copyright 2025 Fonticons, Inc.--><path d="M439.6 236.1 244 40.5c-5.4-5.5-12.8-8.5-20.4-8.5s-15 3-20.4 8.4L162.5 81l51.5 51.5c27.1-9.1 52.7 16.8 43.4 43.7l49.7 49.7c34.2-11.8 61.2 31 35.5 56.7-26.5 26.5-70.2-2.9-56-37.3L240.3 199v121.9c25.3 12.5 22.3 41.8 9.1 55-6.4 6.4-15.2 10.1-24.3 10.1s-17.8-3.6-24.3-10.1c-17.6-17.6-11.1-46.9 11.2-56v-123c-20.8-8.5-24.6-30.7-18.6-45L142.6 101 8.5 235.1C3 240.6 0 247.9 0 255.5s3 15 8.5 20.4l195.6 195.7c5.4 5.4 12.7 8.4 20.4 8.4s15-3 20.4-8.4l194.7-194.7c5.4-5.4 8.4-12.8 8.4-20.4s-3-15-8.4-20.4"/></svg>
        </div>
        <div class="md-source__repository">
          docling-project/docling
        </div>
      </a>
    </div>

  </nav>
</header>
|
||
|
||
<div class="md-container" data-md-component="container">
|
||
|
||
|
||
|
||
|
||
|
||
<!--
  Top-level section tabs. The list may contain only list items, so the
  stray text that sat between them was removed. "Reference" carries the
  active modifier class on this page.
-->
<nav class="md-tabs" aria-label="Tabs" data-md-component="tabs">
  <div class="md-grid">
    <ul class="md-tabs__list">
      <li class="md-tabs__item">
        <a href="../.." class="md-tabs__link">
          Documentation
        </a>
      </li>
      <li class="md-tabs__item">
        <a href="../../concepts/" class="md-tabs__link">
          Concepts
        </a>
      </li>
      <li class="md-tabs__item">
        <a href="../../examples/" class="md-tabs__link">
          Examples
        </a>
      </li>
      <li class="md-tabs__item">
        <a href="../../integrations/" class="md-tabs__link">
          Integrations
        </a>
      </li>
      <li class="md-tabs__item md-tabs__item--active">
        <a href="../document_converter/" class="md-tabs__link">
          Reference
        </a>
      </li>
    </ul>
  </div>
</nav>
|
||
|
||
|
||
|
||
<main class="md-main" data-md-component="main">
|
||
<div class="md-main__inner md-grid">
|
||
|
||
|
||
|
||
<div class="md-sidebar md-sidebar--primary" data-md-component="sidebar" data-md-type="navigation" >
|
||
<div class="md-sidebar__scrollwrap">
|
||
<div class="md-sidebar__inner">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<nav class="md-nav md-nav--primary md-nav--lifted" aria-label="Navigation" data-md-level="0">
|
||
<!--
  Sidebar title (logo plus site name; the label targets the #__drawer
  checkbox) followed by the repository link. Stray text between the
  elements was removed.
-->
<label class="md-nav__title" for="__drawer">
  <a href="../.." title="Docling" class="md-nav__button md-logo" aria-label="Docling" data-md-component="logo">
    <img src="../../assets/logo.png" alt="logo">
  </a>
  Docling
</label>
<div class="md-nav__source">
  <a href="https://github.com/docling-project/docling" title="Go to repository" class="md-source" data-md-component="source">
    <div class="md-source__icon md-icon">
      <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 448 512"><!--! Font Awesome Free 7.1.0 by @fontawesome - https://fontawesome.com License - https://fontawesome.com/license/free (Icons: CC BY 4.0, Fonts: SIL OFL 1.1, Code: MIT License) Copyright 2025 Fonticons, Inc.--><path d="M439.6 236.1 244 40.5c-5.4-5.5-12.8-8.5-20.4-8.5s-15 3-20.4 8.4L162.5 81l51.5 51.5c27.1-9.1 52.7 16.8 43.4 43.7l49.7 49.7c34.2-11.8 61.2 31 35.5 56.7-26.5 26.5-70.2-2.9-56-37.3L240.3 199v121.9c25.3 12.5 22.3 41.8 9.1 55-6.4 6.4-15.2 10.1-24.3 10.1s-17.8-3.6-24.3-10.1c-17.6-17.6-11.1-46.9 11.2-56v-123c-20.8-8.5-24.6-30.7-18.6-45L142.6 101 8.5 235.1C3 240.6 0 247.9 0 255.5s3 15 8.5 20.4l195.6 195.7c5.4 5.4 12.7 8.4 20.4 8.4s15-3 20.4-8.4l194.7-194.7c5.4-5.4 8.4-12.8 8.4-20.4s-3-15-8.4-20.4"/></svg>
    </div>
    <div class="md-source__repository">
      docling-project/docling
    </div>
  </a>
</div>
|
||
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<!--
  Sidebar entry for the "Documentation" section. Each nested section pairs
  a checkbox (#__nav_1, #__nav_1_2, ...) with labels that target it and a
  nested nav whose aria-labelledby points at the matching *_label id.
  Stray text between the elements was removed.
-->
<li class="md-nav__item md-nav__item--nested">
  <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_1">
  <div class="md-nav__link md-nav__container">
    <a href="../.." class="md-nav__link ">
      <span class="md-ellipsis">
        Documentation
      </span>
    </a>
    <label class="md-nav__link " for="__nav_1" id="__nav_1_label" tabindex="0">
      <span class="md-nav__icon md-icon"></span>
    </label>
  </div>
  <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_1_label" aria-expanded="false">
    <label class="md-nav__title" for="__nav_1">
      <span class="md-nav__icon md-icon"></span>
      Documentation
    </label>
    <ul class="md-nav__list" data-md-scrollfix>

      <!-- Getting started -->
      <li class="md-nav__item md-nav__item--nested">
        <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_1_2">
        <label class="md-nav__link" for="__nav_1_2" id="__nav_1_2_label" tabindex="0">
          <span class="md-ellipsis">
            Getting started
          </span>
          <span class="md-nav__icon md-icon"></span>
        </label>
        <nav class="md-nav" data-md-level="2" aria-labelledby="__nav_1_2_label" aria-expanded="false">
          <label class="md-nav__title" for="__nav_1_2">
            <span class="md-nav__icon md-icon"></span>
            Getting started
          </label>
          <ul class="md-nav__list" data-md-scrollfix>
            <li class="md-nav__item">
              <a href="../../getting_started/installation/" class="md-nav__link">
                <span class="md-ellipsis">
                  Installation
                </span>
              </a>
            </li>
            <li class="md-nav__item">
              <a href="../../getting_started/quickstart/" class="md-nav__link">
                <span class="md-ellipsis">
                  Quickstart
                </span>
              </a>
            </li>
          </ul>
        </nav>
      </li>

      <!-- Usage -->
      <li class="md-nav__item md-nav__item--nested">
        <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_1_3">
        <label class="md-nav__link" for="__nav_1_3" id="__nav_1_3_label" tabindex="0">
          <span class="md-ellipsis">
            Usage
          </span>
          <span class="md-nav__icon md-icon"></span>
        </label>
        <nav class="md-nav" data-md-level="2" aria-labelledby="__nav_1_3_label" aria-expanded="false">
          <label class="md-nav__title" for="__nav_1_3">
            <span class="md-nav__icon md-icon"></span>
            Usage
          </label>
          <ul class="md-nav__list" data-md-scrollfix>
            <li class="md-nav__item">
              <a href="../../usage/advanced_options/" class="md-nav__link">
                <span class="md-ellipsis">
                  Advanced options
                </span>
              </a>
            </li>
            <li class="md-nav__item">
              <a href="../../usage/supported_formats/" class="md-nav__link">
                <span class="md-ellipsis">
                  Supported formats
                </span>
              </a>
            </li>
            <li class="md-nav__item">
              <a href="../../usage/enrichments/" class="md-nav__link">
                <span class="md-ellipsis">
                  Enrichment features
                </span>
              </a>
            </li>
            <li class="md-nav__item">
              <a href="../../usage/vision_models/" class="md-nav__link">
                <span class="md-ellipsis">
                  Vision models
                </span>
              </a>
            </li>
            <li class="md-nav__item">
              <a href="../../usage/gpu/" class="md-nav__link">
                <span class="md-ellipsis">
                  GPU support
                </span>
              </a>
            </li>
            <li class="md-nav__item">
              <a href="../../usage/mcp/" class="md-nav__link">
                <span class="md-ellipsis">
                  MCP server
                </span>
              </a>
            </li>
            <li class="md-nav__item">
              <a href="../../usage/jobkit/" class="md-nav__link">
                <span class="md-ellipsis">
                  Jobkit
                </span>
              </a>
            </li>
          </ul>
        </nav>
      </li>

      <!--
        FAQ. This item has no toggle label, so the nested nav's
        aria-labelledby used to reference an id that did not exist. The
        link now carries that id, which gives the reference a target.
      -->
      <li class="md-nav__item md-nav__item--nested">
        <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_1_4">
        <div class="md-nav__link md-nav__container">
          <a href="../../faq/" class="md-nav__link " id="__nav_1_4_label">
            <span class="md-ellipsis">
              FAQ
            </span>
          </a>
        </div>
        <nav class="md-nav" data-md-level="2" aria-labelledby="__nav_1_4_label" aria-expanded="false">
          <label class="md-nav__title" for="__nav_1_4">
            <span class="md-nav__icon md-icon"></span>
            FAQ
          </label>
          <ul class="md-nav__list" data-md-scrollfix>
          </ul>
        </nav>
      </li>

    </ul>
  </nav>
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<!--
  Sidebar entry for the "Concepts" section: a link to the section index,
  a toggle label for the #__nav_2 checkbox, and the nested list of concept
  pages. Stray text between the elements was removed.
-->
<li class="md-nav__item md-nav__item--nested">
  <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_2">
  <div class="md-nav__link md-nav__container">
    <a href="../../concepts/" class="md-nav__link ">
      <span class="md-ellipsis">
        Concepts
      </span>
    </a>
    <label class="md-nav__link " for="__nav_2" id="__nav_2_label" tabindex="0">
      <span class="md-nav__icon md-icon"></span>
    </label>
  </div>
  <nav class="md-nav" data-md-level="1" aria-labelledby="__nav_2_label" aria-expanded="false">
    <label class="md-nav__title" for="__nav_2">
      <span class="md-nav__icon md-icon"></span>
      Concepts
    </label>
    <ul class="md-nav__list" data-md-scrollfix>
      <li class="md-nav__item">
        <a href="../../concepts/architecture/" class="md-nav__link">
          <span class="md-ellipsis">
            Architecture
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../concepts/docling_document/" class="md-nav__link">
          <span class="md-ellipsis">
            Docling Document
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../concepts/serialization/" class="md-nav__link">
          <span class="md-ellipsis">
            Serialization
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../concepts/confidence_scores/" class="md-nav__link">
          <span class="md-ellipsis">
            Confidence Scores
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../concepts/chunking/" class="md-nav__link">
          <span class="md-ellipsis">
            Chunking
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../concepts/plugins/" class="md-nav__link">
          <span class="md-ellipsis">
            Plugins
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3" >
|
||
|
||
|
||
<div class="md-nav__link md-nav__container">
|
||
<a href="../../examples/" class="md-nav__link ">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Examples
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
|
||
|
||
<label class="md-nav__link " for="__nav_3" id="__nav_3_label" tabindex="0">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
</div>
|
||
|
||
<nav class="md-nav" data-md-level="1" aria-labelledby="__nav_3_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_3">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
Examples
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<!--
  Sidebar group "Conversion" inside the Examples section: a toggle label
  for the #__nav_3_2 checkbox and the nested list of example pages.
  Stray text between the elements was removed.
-->
<li class="md-nav__item md-nav__item--nested">
  <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3_2">
  <label class="md-nav__link" for="__nav_3_2" id="__nav_3_2_label" tabindex="0">
    <span class="md-ellipsis">
      🔀 Conversion
    </span>
    <span class="md-nav__icon md-icon"></span>
  </label>
  <nav class="md-nav" data-md-level="2" aria-labelledby="__nav_3_2_label" aria-expanded="false">
    <label class="md-nav__title" for="__nav_3_2">
      <span class="md-nav__icon md-icon"></span>
      🔀 Conversion
    </label>
    <ul class="md-nav__list" data-md-scrollfix>
      <li class="md-nav__item">
        <a href="../../examples/minimal/" class="md-nav__link">
          <span class="md-ellipsis">
            Simple conversion
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/custom_convert/" class="md-nav__link">
          <span class="md-ellipsis">
            Custom conversion
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/batch_convert/" class="md-nav__link">
          <span class="md-ellipsis">
            Batch conversion
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/run_with_formats/" class="md-nav__link">
          <span class="md-ellipsis">
            Multi-format conversion
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/minimal_vlm_pipeline/" class="md-nav__link">
          <span class="md-ellipsis">
            VLM pipeline with GraniteDocling
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/vlm_pipeline_api_model/" class="md-nav__link">
          <span class="md-ellipsis">
            VLM pipeline with remote model
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/compare_vlm_models/" class="md-nav__link">
          <span class="md-ellipsis">
            VLM comparison
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/minimal_asr_pipeline/" class="md-nav__link">
          <span class="md-ellipsis">
            ASR pipeline with Whisper
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/export_figures/" class="md-nav__link">
          <span class="md-ellipsis">
            Figure export
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/export_tables/" class="md-nav__link">
          <span class="md-ellipsis">
            Table export
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/export_multimodal/" class="md-nav__link">
          <span class="md-ellipsis">
            Multimodal export
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/full_page_ocr/" class="md-nav__link">
          <span class="md-ellipsis">
            Force full page OCR
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/tesseract_lang_detection/" class="md-nav__link">
          <span class="md-ellipsis">
            Automatic OCR language detection with tesseract
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/rapidocr_with_custom_models/" class="md-nav__link">
          <span class="md-ellipsis">
            RapidOCR with custom OCR models
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/suryaocr_with_custom_models/" class="md-nav__link">
          <span class="md-ellipsis">
            SuryaOCR with custom OCR models
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/run_with_accelerator/" class="md-nav__link">
          <span class="md-ellipsis">
            Accelerator options
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/pii_obfuscate/" class="md-nav__link">
          <span class="md-ellipsis">
            Detect and obfuscate PII
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/translate/" class="md-nav__link">
          <span class="md-ellipsis">
            Simple translation
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/backend_csv/" class="md-nav__link">
          <span class="md-ellipsis">
            Conversion of CSV files
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/backend_xml_rag/" class="md-nav__link">
          <span class="md-ellipsis">
            Conversion of custom XML
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<!--
  Sidebar group "Serialization and chunking" inside the Examples section:
  a toggle label for the #__nav_3_3 checkbox and the nested list of
  example pages. Stray text between the elements was removed and the
  ampersands in visible text are written as character references.
-->
<li class="md-nav__item md-nav__item--nested">
  <input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3_3">
  <label class="md-nav__link" for="__nav_3_3" id="__nav_3_3_label" tabindex="0">
    <span class="md-ellipsis">
      ✂️ Serialization &amp; chunking
    </span>
    <span class="md-nav__icon md-icon"></span>
  </label>
  <nav class="md-nav" data-md-level="2" aria-labelledby="__nav_3_3_label" aria-expanded="false">
    <label class="md-nav__title" for="__nav_3_3">
      <span class="md-nav__icon md-icon"></span>
      ✂️ Serialization &amp; chunking
    </label>
    <ul class="md-nav__list" data-md-scrollfix>
      <li class="md-nav__item">
        <a href="../../examples/serialization/" class="md-nav__link">
          <span class="md-ellipsis">
            Serialization
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/hybrid_chunking/" class="md-nav__link">
          <span class="md-ellipsis">
            Hybrid chunking
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="../../examples/advanced_chunking_and_serialization/" class="md-nav__link">
          <span class="md-ellipsis">
            Advanced chunking &amp; serialization
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3_4" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_3_4" id="__nav_3_4_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
📤 Information extraction
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_3_4_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_3_4">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
📤 Information extraction
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/extraction/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Information extraction
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3_5" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_3_5" id="__nav_3_5_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
🤖 RAG with AI dev frameworks
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_3_5_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_3_5">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
🤖 RAG with AI dev frameworks
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/rag_haystack/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with Haystack
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/rag_langchain/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with LangChain
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/rag_llamaindex/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with LlamaIndex
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/visual_grounding/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Visual grounding
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3_6" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_3_6" id="__nav_3_6_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
🖼️ Picture annotation
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_3_6_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_3_6">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
🖼️ Picture annotation
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/pictures_description/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Annotate picture with local VLM
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/pictures_description_api/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Annotate picture with remote VLM
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3_7" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_3_7" id="__nav_3_7_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
✨ Enrichment development
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_3_7_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_3_7">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
✨ Enrichment development
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/develop_picture_enrichment/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Figure enrichment
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/develop_formula_understanding/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Formula enrichment
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/enrich_doclingdocument/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Enrich a DoclingDocument
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3_8" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_3_8" id="__nav_3_8_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
⚡️ GPU optimization
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_3_8_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_3_8">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
⚡️ GPU optimization
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/gpu_standard_pipeline/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Standard pipeline
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/gpu_vlm_pipeline/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
VLM pipeline
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/parquet_images/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Parquet benchmark
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_3_9" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_3_9" id="__nav_3_9_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
🗂️ More examples
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_3_9_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_3_9">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
🗂️ More examples
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/dpk-ingest-chunk-tokenize/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Chunking & tokenization with Data Prep Kit
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/rag_azuresearch/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with Azure AI Search
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="https://github.com/ibm-granite-community/granite-snack-cookbook/blob/main/recipes/RAG/Granite_Docling_RAG.ipynb" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with Granite [↗]
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/rag_milvus/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with Milvus
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/rag_opensearch/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with OpenSearch
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/rag_weaviate/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with Weaviate
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/retrieval_qdrant/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Retrieval with Qdrant
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../examples/rag_mongodb/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with MongoDB + VoyageAI
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="https://github.com/workloads/pathfinder-prism" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RAG with Vault PII transform [↗]
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_4" >
|
||
|
||
|
||
<div class="md-nav__link md-nav__container">
|
||
<a href="../../integrations/" class="md-nav__link ">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Integrations
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
|
||
|
||
<label class="md-nav__link " for="__nav_4" id="__nav_4_label" tabindex="0">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
</div>
|
||
|
||
<nav class="md-nav" data-md-level="1" aria-labelledby="__nav_4_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_4">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
Integrations
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_4_2" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_4_2" id="__nav_4_2_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
🤖 Agentic / AI dev frameworks
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_4_2_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_4_2">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
🤖 Agentic / AI dev frameworks
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/bee/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Bee Agent Framework
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/crewai/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Crew AI
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/haystack/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Haystack
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/hector/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Hector
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/langchain/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
LangChain
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/langflow/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Langflow
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/llamaindex/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
LlamaIndex
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/txtai/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
txtai
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_4_3" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_4_3" id="__nav_4_3_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
⭐️ Featured
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_4_3_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_4_3">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
⭐️ Featured
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/apify/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Apify
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/data_prep_kit/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Data Prep Kit
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/instructlab/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
InstructLab
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/nvidia/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
NVIDIA
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/prodigy/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Prodigy
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/rhel_ai/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
RHEL AI
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/spacy/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
spaCy
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_4_4" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_4_4" id="__nav_4_4_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
🗂️ More integrations
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_4_4_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_4_4">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
🗂️ More integrations
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/arconia/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Arconia
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/cloudera/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Cloudera
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/docetl/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
DocETL
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/kotaemon/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Kotaemon
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/opencontracts/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
OpenContracts
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/openwebui/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Open WebUI
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/quarkus/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Quarkus
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../../integrations/vectara/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Vectara
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--active md-nav__item--section md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_5" checked>
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_5" id="__nav_5_label" tabindex="">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Reference
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="1" aria-labelledby="__nav_5_label" aria-expanded="true">
|
||
<label class="md-nav__title" for="__nav_5">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
Reference
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--active md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_5_1" checked>
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_5_1" id="__nav_5_1_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Python API
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_5_1_label" aria-expanded="true">
|
||
<label class="md-nav__title" for="__nav_5_1">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
Python API
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../document_converter/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Document Converter
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--active">
|
||
|
||
<input class="md-nav__toggle md-toggle" type="checkbox" id="__toc">
|
||
|
||
|
||
|
||
|
||
|
||
<label class="md-nav__link md-nav__link--active" for="__toc">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Pipeline options
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<a href="./" class="md-nav__link md-nav__link--active">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Pipeline options
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
|
||
|
||
|
||
<nav class="md-nav md-nav--secondary" aria-label="Table of contents">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<label class="md-nav__title" for="__toc">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
Table of contents
|
||
</label>
|
||
<ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-module"></code> pipeline_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" pipeline_options">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.granite_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> granite_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.smolvlm_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> smolvlm_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> AsrPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" AsrPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.asr_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> asr_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseLayoutOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> BaseLayoutOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" BaseLayoutOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseLayoutOptions.keep_empty_clusters" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> keep_empty_clusters
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseLayoutOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseLayoutOptions.skip_cell_assignment" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> skip_cell_assignment
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<!-- TOC entry for BaseOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.BaseOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> BaseOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="BaseOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.BaseOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for BaseTableStructureOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.BaseTableStructureOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> BaseTableStructureOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="BaseTableStructureOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.BaseTableStructureOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for ConvertPipelineOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> ConvertPipelineOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="ConvertPipelineOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.accelerator_options" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.allow_external_plugins" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.artifacts_path" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_classification" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_description" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.document_timeout" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.enable_remote_services" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.picture_description_options" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for EasyOcrOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.EasyOcrOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> EasyOcrOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="EasyOcrOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.bitmap_area_threshold" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.confidence_threshold" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> confidence_threshold
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.download_enabled" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> download_enabled
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.force_full_page_ocr" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.lang" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.model_config" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.model_storage_directory" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_storage_directory
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.recog_network" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> recog_network
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.suppress_mps_warnings" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> suppress_mps_warnings
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.EasyOcrOptions.use_gpu" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> use_gpu
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for LayoutOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.LayoutOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> LayoutOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="LayoutOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.LayoutOptions.create_orphan_clusters" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> create_orphan_clusters
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.LayoutOptions.keep_empty_clusters" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> keep_empty_clusters
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.LayoutOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.LayoutOptions.model_spec" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_spec
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.LayoutOptions.skip_cell_assignment" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> skip_cell_assignment
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for OcrAutoOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.OcrAutoOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> OcrAutoOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="OcrAutoOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrAutoOptions.bitmap_area_threshold" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrAutoOptions.force_full_page_ocr" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrAutoOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrAutoOptions.lang" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for OcrEngine: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.OcrEngine" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> OcrEngine
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="OcrEngine">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrEngine.AUTO" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> AUTO
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrEngine.EASYOCR" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> EASYOCR
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrEngine.OCRMAC" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> OCRMAC
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrEngine.RAPIDOCR" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> RAPIDOCR
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrEngine.TESSERACT" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> TESSERACT
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrEngine.TESSERACT_CLI" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> TESSERACT_CLI
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for OcrMacOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.OcrMacOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> OcrMacOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="OcrMacOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrMacOptions.bitmap_area_threshold" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrMacOptions.force_full_page_ocr" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrMacOptions.framework" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> framework
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrMacOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrMacOptions.lang" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrMacOptions.model_config" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrMacOptions.recognition" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> recognition
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for OcrOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.OcrOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> OcrOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="OcrOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrOptions.bitmap_area_threshold" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrOptions.force_full_page_ocr" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.OcrOptions.lang" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for PaginatedPipelineOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PaginatedPipelineOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="PaginatedPipelineOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.accelerator_options" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.allow_external_plugins" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.artifacts_path" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_classification" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_description" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.document_timeout" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.enable_remote_services" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_page_images" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_page_images
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_picture_images" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_picture_images
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.images_scale" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> images_scale
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.picture_description_options" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for PdfBackend: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.PdfBackend" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PdfBackend
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="PdfBackend">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V1" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> DLPARSE_V1
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V2" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> DLPARSE_V2
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V4" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> DLPARSE_V4
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfBackend.PYPDFIUM2" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> PYPDFIUM2
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<!-- TOC entry for PdfPipelineOptions: link to the class anchor, then a nested list of links to its member anchors. -->
<li class="md-nav__item">
  <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions" class="md-nav__link">
    <span class="md-ellipsis">
      <code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PdfPipelineOptions
    </span>
  </a>
  <!-- aria-label carries the class name without leading whitespace so the landmark gets a clean accessible name. -->
  <nav class="md-nav" aria-label="PdfPipelineOptions">
    <ul class="md-nav__list">
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.accelerator_options" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.allow_external_plugins" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.artifacts_path" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.batch_polling_interval_seconds" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_polling_interval_seconds
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_code_enrichment" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_code_enrichment
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_formula_enrichment" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_formula_enrichment
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_ocr" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_ocr
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_classification" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_description" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_table_structure" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_table_structure
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.document_timeout" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.enable_remote_services" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.force_backend_text" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_backend_text
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_page_images" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_page_images
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_parsed_pages" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_parsed_pages
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_picture_images" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_picture_images
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_table_images" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_table_images
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.images_scale" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> images_scale
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.kind" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.layout_batch_size" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> layout_batch_size
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.layout_options" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> layout_options
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_batch_size" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ocr_batch_size
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_options" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ocr_options
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.picture_description_options" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.queue_max_size" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> queue_max_size
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.table_batch_size" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> table_batch_size
          </span>
        </a>
      </li>
      <li class="md-nav__item">
        <a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.table_structure_options" class="md-nav__link">
          <span class="md-ellipsis">
            <code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> table_structure_options
          </span>
        </a>
      </li>
    </ul>
  </nav>
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PictureDescriptionApiOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PictureDescriptionApiOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.concurrency" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> concurrency
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.headers" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> headers
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.params" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> params
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.picture_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.prompt" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> prompt
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.provenance" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> provenance
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.url" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> url
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PictureDescriptionBaseOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PictureDescriptionBaseOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.picture_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PictureDescriptionVlmOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PictureDescriptionVlmOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.generation_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generation_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.picture_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.prompt" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> prompt
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_cache_folder" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> repo_cache_folder
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_id" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> repo_id
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> ProcessingPipeline
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" ProcessingPipeline">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline.ASR" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ASR
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline.LEGACY" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> LEGACY
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline.STANDARD" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> STANDARD
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline.VLM" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> VLM
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> RapidOcrOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" RapidOcrOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.backend" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> backend
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.cls_model_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> cls_model_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.det_model_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> det_model_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.font_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> font_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.model_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.print_verbose" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> print_verbose
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.rapidocr_params" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> rapidocr_params
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.rec_font_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> rec_font_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.rec_keys_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> rec_keys_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.rec_model_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> rec_model_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.text_score" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> text_score
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.use_cls" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> use_cls
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.use_det" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> use_det
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.use_rec" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> use_rec
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableFormerMode" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> TableFormerMode
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" TableFormerMode">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableFormerMode.ACCURATE" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ACCURATE
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableFormerMode.FAST" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> FAST
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableStructureOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> TableStructureOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" TableStructureOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableStructureOptions.do_cell_matching" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_cell_matching
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableStructureOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableStructureOptions.mode" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> mode
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> TesseractCliOcrOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" TesseractCliOcrOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.model_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.psm" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> psm
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.tesseract_cmd" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> tesseract_cmd
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> TesseractOcrOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" TesseractOcrOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.model_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.psm" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> psm
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> ThreadedPdfPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" ThreadedPdfPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.batch_polling_interval_seconds" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_polling_interval_seconds
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_code_enrichment" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_code_enrichment
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_formula_enrichment" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_formula_enrichment
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_classification" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_table_structure" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_table_structure
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.force_backend_text" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_backend_text
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_page_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_page_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_parsed_pages" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_parsed_pages
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_picture_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_picture_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_table_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_table_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.images_scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> images_scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> layout_batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> layout_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ocr_batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ocr_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.picture_description_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.queue_max_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> queue_max_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> table_batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_structure_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> table_structure_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> VlmExtractionPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" VlmExtractionPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.vlm_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> vlm_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> VlmPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" VlmPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_classification" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.force_backend_text" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_backend_text
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.generate_page_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_page_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.generate_picture_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_picture_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.images_scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> images_scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.picture_description_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.vlm_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> vlm_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../docling_document/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
Docling Document
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item md-nav__item--nested">
|
||
|
||
|
||
|
||
<input class="md-nav__toggle md-toggle " type="checkbox" id="__nav_5_2" >
|
||
|
||
|
||
<label class="md-nav__link" for="__nav_5_2" id="__nav_5_2_label" tabindex="0">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
CLI
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
<span class="md-nav__icon md-icon"></span>
|
||
</label>
|
||
|
||
<nav class="md-nav" data-md-level="2" aria-labelledby="__nav_5_2_label" aria-expanded="false">
|
||
<label class="md-nav__title" for="__nav_5_2">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
|
||
|
||
CLI
|
||
|
||
|
||
</label>
|
||
<ul class="md-nav__list" data-md-scrollfix>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-nav__item">
|
||
<a href="../cli/" class="md-nav__link">
|
||
|
||
|
||
|
||
<span class="md-ellipsis">
|
||
|
||
|
||
CLI reference
|
||
|
||
|
||
|
||
</span>
|
||
|
||
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
|
||
|
||
</ul>
|
||
</nav>
|
||
</div>
|
||
</div>
|
||
</div>
|
||
|
||
|
||
|
||
<div class="md-sidebar md-sidebar--secondary" data-md-component="sidebar" data-md-type="toc" >
|
||
<div class="md-sidebar__scrollwrap">
|
||
<div class="md-sidebar__inner">
|
||
|
||
|
||
<nav class="md-nav md-nav--secondary" aria-label="Table of contents">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<label class="md-nav__title" for="__toc">
|
||
<span class="md-nav__icon md-icon"></span>
|
||
Table of contents
|
||
</label>
|
||
<ul class="md-nav__list" data-md-component="toc" data-md-scrollfix>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-module"></code> pipeline_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" pipeline_options">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.granite_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> granite_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.smolvlm_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> smolvlm_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> AsrPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" AsrPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.asr_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> asr_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.AsrPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseLayoutOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> BaseLayoutOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" BaseLayoutOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseLayoutOptions.keep_empty_clusters" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> keep_empty_clusters
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseLayoutOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseLayoutOptions.skip_cell_assignment" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> skip_cell_assignment
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> BaseOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" BaseOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseTableStructureOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> BaseTableStructureOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" BaseTableStructureOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.BaseTableStructureOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> ConvertPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" ConvertPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_classification" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.picture_description_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> EasyOcrOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" EasyOcrOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.confidence_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> confidence_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.download_enabled" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> download_enabled
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.model_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.model_storage_directory" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_storage_directory
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.recog_network" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> recog_network
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.suppress_mps_warnings" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> suppress_mps_warnings
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.EasyOcrOptions.use_gpu" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> use_gpu
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.LayoutOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> LayoutOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" LayoutOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.LayoutOptions.create_orphan_clusters" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> create_orphan_clusters
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.LayoutOptions.keep_empty_clusters" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> keep_empty_clusters
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.LayoutOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.LayoutOptions.model_spec" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_spec
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.LayoutOptions.skip_cell_assignment" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> skip_cell_assignment
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrAutoOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> OcrAutoOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" OcrAutoOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrAutoOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrAutoOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrAutoOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrAutoOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrEngine" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> OcrEngine
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" OcrEngine">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrEngine.AUTO" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> AUTO
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrEngine.EASYOCR" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> EASYOCR
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrEngine.OCRMAC" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> OCRMAC
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrEngine.RAPIDOCR" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> RAPIDOCR
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrEngine.TESSERACT" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> TESSERACT
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrEngine.TESSERACT_CLI" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> TESSERACT_CLI
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrMacOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> OcrMacOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" OcrMacOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrMacOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrMacOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrMacOptions.framework" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> framework
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrMacOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrMacOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrMacOptions.model_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrMacOptions.recognition" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> recognition
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> OcrOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" OcrOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.OcrOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PaginatedPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PaginatedPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_classification" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_page_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_page_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_picture_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_picture_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.images_scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> images_scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.picture_description_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfBackend" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PdfBackend
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PdfBackend">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V1" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> DLPARSE_V1
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V2" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> DLPARSE_V2
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V4" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> DLPARSE_V4
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfBackend.PYPDFIUM2" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> PYPDFIUM2
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PdfPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PdfPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.batch_polling_interval_seconds" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_polling_interval_seconds
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_code_enrichment" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_code_enrichment
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_formula_enrichment" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_formula_enrichment
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_classification" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_table_structure" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_table_structure
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.force_backend_text" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_backend_text
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_page_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_page_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_parsed_pages" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_parsed_pages
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_picture_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_picture_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_table_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_table_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.images_scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> images_scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.layout_batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> layout_batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.layout_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> layout_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ocr_batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ocr_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.picture_description_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.queue_max_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> queue_max_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.table_batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> table_batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PdfPipelineOptions.table_structure_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> table_structure_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PictureDescriptionApiOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PictureDescriptionApiOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.concurrency" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> concurrency
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.headers" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> headers
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.params" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> params
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.picture_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.prompt" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> prompt
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.provenance" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> provenance
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.url" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> url
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PictureDescriptionBaseOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PictureDescriptionBaseOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.picture_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PictureDescriptionVlmOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PictureDescriptionVlmOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.generation_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generation_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.picture_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.prompt" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> prompt
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_cache_folder" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> repo_cache_folder
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_id" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> repo_id
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> PipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" PipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.PipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> ProcessingPipeline
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" ProcessingPipeline">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline.ASR" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ASR
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline.LEGACY" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> LEGACY
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline.STANDARD" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> STANDARD
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ProcessingPipeline.VLM" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> VLM
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> RapidOcrOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" RapidOcrOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.backend" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> backend
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.cls_model_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> cls_model_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.det_model_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> det_model_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.font_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> font_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.model_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.print_verbose" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> print_verbose
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.rapidocr_params" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> rapidocr_params
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.rec_font_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> rec_font_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.rec_keys_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> rec_keys_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.rec_model_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> rec_model_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.text_score" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> text_score
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.use_cls" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> use_cls
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.use_det" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> use_det
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.RapidOcrOptions.use_rec" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> use_rec
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableFormerMode" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> TableFormerMode
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" TableFormerMode">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableFormerMode.ACCURATE" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ACCURATE
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableFormerMode.FAST" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> FAST
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableStructureOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> TableStructureOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" TableStructureOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableStructureOptions.do_cell_matching" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_cell_matching
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableStructureOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TableStructureOptions.mode" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> mode
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> TesseractCliOcrOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" TesseractCliOcrOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.model_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.psm" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> psm
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.tesseract_cmd" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> tesseract_cmd
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> TesseractOcrOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" TesseractOcrOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.bitmap_area_threshold" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> bitmap_area_threshold
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.force_full_page_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_full_page_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.lang" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> lang
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.model_config" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> model_config
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.TesseractOcrOptions.psm" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> psm
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> ThreadedPdfPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" ThreadedPdfPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.batch_polling_interval_seconds" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> batch_polling_interval_seconds
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_code_enrichment" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_code_enrichment
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_formula_enrichment" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_formula_enrichment
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_ocr" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_ocr
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_classification" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_table_structure" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_table_structure
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.force_backend_text" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_backend_text
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_page_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_page_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_parsed_pages" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_parsed_pages
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_picture_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_picture_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_table_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_table_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.images_scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> images_scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> layout_batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> layout_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ocr_batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> ocr_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.picture_description_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.queue_max_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> queue_max_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_batch_size" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> table_batch_size
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_structure_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> table_structure_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> VlmExtractionPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" VlmExtractionPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.vlm_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> vlm_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-class"></code> VlmPipelineOptions
|
||
|
||
</span>
|
||
</a>
|
||
|
||
<nav class="md-nav" aria-label=" VlmPipelineOptions">
|
||
<ul class="md-nav__list">
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.accelerator_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> accelerator_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.allow_external_plugins" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> allow_external_plugins
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.artifacts_path" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> artifacts_path
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_classification" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_classification
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_description" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> do_picture_description
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.document_timeout" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> document_timeout
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.enable_remote_services" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> enable_remote_services
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.force_backend_text" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> force_backend_text
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.generate_page_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_page_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.generate_picture_images" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> generate_picture_images
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.images_scale" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> images_scale
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.kind" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> kind
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.picture_description_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> picture_description_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
<li class="md-nav__item">
|
||
<a href="#docling.datamodel.pipeline_options.VlmPipelineOptions.vlm_options" class="md-nav__link">
|
||
<span class="md-ellipsis">
|
||
|
||
<code class="doc-symbol doc-symbol-toc doc-symbol-attribute"></code> vlm_options
|
||
|
||
</span>
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</nav>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
|
||
</nav>
|
||
</div>
|
||
</div>
|
||
</div>
|
||
|
||
|
||
|
||
<div class="md-content" data-md-component="content">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<nav class="md-path" aria-label="Navigation" >
|
||
<ol class="md-path__list">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-path__item">
|
||
<a href="../document_converter/" class="md-path__link">
|
||
|
||
<span class="md-ellipsis">
|
||
Reference
|
||
</span>
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<li class="md-path__item">
|
||
<a href="../document_converter/" class="md-path__link">
|
||
|
||
<span class="md-ellipsis">
|
||
Python API
|
||
</span>
|
||
|
||
</a>
|
||
</li>
|
||
|
||
|
||
|
||
|
||
</ol>
|
||
</nav>
|
||
|
||
|
||
<article class="md-content__inner md-typeset">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<h1 id="pipeline-options">Pipeline options</h1>
|
||
<p>Pipeline options allow you to customize the execution of the models during the conversion pipeline.
|
||
This includes options for the OCR engines, the table model as well as enrichment options which
|
||
can be enabled with <code>do_xyz = True</code>.</p>
|
||
<p>This is an automatically generated API reference of all the pipeline options available in Docling.</p>
|
||
|
||
|
||
<div class="doc doc-object doc-module">
|
||
|
||
|
||
|
||
<h2 id="docling.datamodel.pipeline_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-module"></code> <span class="doc doc-object-name doc-module-name">pipeline_options</span>
|
||
|
||
|
||
</h2>
|
||
|
||
<div class="doc doc-contents first">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Classes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">AsrPipelineOptions</span> (<code>docling.datamodel.pipeline_options.AsrPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.AsrPipelineOptions">AsrPipelineOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">BaseLayoutOptions</span> (<code>docling.datamodel.pipeline_options.BaseLayoutOptions</code>)" href="#docling.datamodel.pipeline_options.BaseLayoutOptions">BaseLayoutOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Base options for layout models.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">BaseOptions</span> (<code>docling.datamodel.pipeline_options.BaseOptions</code>)" href="#docling.datamodel.pipeline_options.BaseOptions">BaseOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Base class for options.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">BaseTableStructureOptions</span> (<code>docling.datamodel.pipeline_options.BaseTableStructureOptions</code>)" href="#docling.datamodel.pipeline_options.BaseTableStructureOptions">BaseTableStructureOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Base options for table structure models.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">ConvertPipelineOptions</span> (<code>docling.datamodel.pipeline_options.ConvertPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions">ConvertPipelineOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Base convert pipeline options.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">EasyOcrOptions</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions">EasyOcrOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for the EasyOCR engine.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">LayoutOptions</span> (<code>docling.datamodel.pipeline_options.LayoutOptions</code>)" href="#docling.datamodel.pipeline_options.LayoutOptions">LayoutOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for layout processing.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">OcrAutoOptions</span> (<code>docling.datamodel.pipeline_options.OcrAutoOptions</code>)" href="#docling.datamodel.pipeline_options.OcrAutoOptions">OcrAutoOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for picking the OCR engine automatically.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">OcrEngine</span> (<code>docling.datamodel.pipeline_options.OcrEngine</code>)" href="#docling.datamodel.pipeline_options.OcrEngine">OcrEngine</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Enum of valid OCR engines.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">OcrMacOptions</span> (<code>docling.datamodel.pipeline_options.OcrMacOptions</code>)" href="#docling.datamodel.pipeline_options.OcrMacOptions">OcrMacOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for the Mac OCR engine.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">OcrOptions</span> (<code>docling.datamodel.pipeline_options.OcrOptions</code>)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>OCR options.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PaginatedPipelineOptions</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions">PaginatedPipelineOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PdfBackend</span> (<code>docling.datamodel.pipeline_options.PdfBackend</code>)" href="#docling.datamodel.pipeline_options.PdfBackend">PdfBackend</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Enum of valid PDF backends.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PdfPipelineOptions</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions">PdfPipelineOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for the PDF pipeline.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionApiOptions</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions">PictureDescriptionApiOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionBaseOptions</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionBaseOptions</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionVlmOptions</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionVlmOptions</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions">PictureDescriptionVlmOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PipelineOptions</span> (<code>docling.datamodel.pipeline_options.PipelineOptions</code>)" href="#docling.datamodel.pipeline_options.PipelineOptions">PipelineOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Base pipeline options.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">ProcessingPipeline</span> (<code>docling.datamodel.pipeline_options.ProcessingPipeline</code>)" href="#docling.datamodel.pipeline_options.ProcessingPipeline">ProcessingPipeline</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">RapidOcrOptions</span> (<code>docling.datamodel.pipeline_options.RapidOcrOptions</code>)" href="#docling.datamodel.pipeline_options.RapidOcrOptions">RapidOcrOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for the RapidOCR engine.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TableFormerMode</span> (<code>docling.datamodel.pipeline_options.TableFormerMode</code>)" href="#docling.datamodel.pipeline_options.TableFormerMode">TableFormerMode</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Modes for the TableFormer model.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TableStructureOptions</span> (<code>docling.datamodel.pipeline_options.TableStructureOptions</code>)" href="#docling.datamodel.pipeline_options.TableStructureOptions">TableStructureOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for the table structure.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TesseractCliOcrOptions</span> (<code>docling.datamodel.pipeline_options.TesseractCliOcrOptions</code>)" href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions">TesseractCliOcrOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for the TesseractCli engine.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TesseractOcrOptions</span> (<code>docling.datamodel.pipeline_options.TesseractOcrOptions</code>)" href="#docling.datamodel.pipeline_options.TesseractOcrOptions">TesseractOcrOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for the Tesseract engine.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">ThreadedPdfPipelineOptions</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions">ThreadedPdfPipelineOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Pipeline options for the threaded PDF pipeline with batching and backpressure control.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">VlmExtractionPipelineOptions</span> (<code>docling.datamodel.pipeline_options.VlmExtractionPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions">VlmExtractionPipelineOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
<p>Options for extraction pipeline.</p>
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">VlmPipelineOptions</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions">VlmPipelineOptions</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">granite_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-module-attribute"><code>module-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.granite_picture_description</code>)" href="#docling.datamodel.pipeline_options.granite_picture_description">granite_picture_description</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">smolvlm_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-module-attribute"><code>module-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.smolvlm_picture_description</code>)" href="#docling.datamodel.pipeline_options.smolvlm_picture_description">smolvlm_picture_description</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.granite_picture_description" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">granite_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-module-attribute"><code>module-attribute</code></small>
|
||
</span>
|
||
|
||
</h3>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">granite_picture_description</span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionVlmOptions</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionVlmOptions</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions">PictureDescriptionVlmOptions</a></span><span class="p">(</span><span class="n"><span title="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions(repo_id)">repo_id</span></span><span class="o">=</span><span class="s1">'ibm-granite/granite-vision-3.3-2b'</span><span class="p">,</span> <span class="n"><span title="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions(prompt)">prompt</span></span><span class="o">=</span><span class="s1">'What is shown in this image?'</span><span class="p">)</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.smolvlm_picture_description" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">smolvlm_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-module-attribute"><code>module-attribute</code></small>
|
||
</span>
|
||
|
||
</h3>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">smolvlm_picture_description</span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionVlmOptions</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionVlmOptions</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions">PictureDescriptionVlmOptions</a></span><span class="p">(</span><span class="n"><span title="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions(repo_id)">repo_id</span></span><span class="o">=</span><span class="s1">'HuggingFaceTB/SmolVLM-256M-Instruct'</span><span class="p">)</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.AsrPipelineOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">AsrPipelineOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PipelineOptions</span> (<code>docling.datamodel.pipeline_options.PipelineOptions</code>)" href="#docling.datamodel.pipeline_options.PipelineOptions">PipelineOptions</a></code></p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.AsrPipelineOptions.accelerator_options</code>)" href="#docling.datamodel.pipeline_options.AsrPipelineOptions.accelerator_options">accelerator_options</a></code></b>
|
||
(<code><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.AsrPipelineOptions.allow_external_plugins</code>)" href="#docling.datamodel.pipeline_options.AsrPipelineOptions.allow_external_plugins">allow_external_plugins</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.AsrPipelineOptions.artifacts_path</code>)" href="#docling.datamodel.pipeline_options.AsrPipelineOptions.artifacts_path">artifacts_path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="typing.Union">Union</span>[<span title="pathlib.Path">Path</span>, <span title="str">str</span>]]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">asr_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.AsrPipelineOptions.asr_options</code>)" href="#docling.datamodel.pipeline_options.AsrPipelineOptions.asr_options">asr_options</a></code></b>
|
||
(<code><span title="typing.Union">Union</span>[<span title="docling.datamodel.pipeline_options_asr_model.InlineAsrOptions">InlineAsrOptions</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.AsrPipelineOptions.document_timeout</code>)" href="#docling.datamodel.pipeline_options.AsrPipelineOptions.document_timeout">document_timeout</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="float">float</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.AsrPipelineOptions.enable_remote_services</code>)" href="#docling.datamodel.pipeline_options.AsrPipelineOptions.enable_remote_services">enable_remote_services</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.AsrPipelineOptions.kind</code>)" href="#docling.datamodel.pipeline_options.AsrPipelineOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.AsrPipelineOptions.accelerator_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">accelerator_options</span><span class="p">:</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.AsrPipelineOptions.allow_external_plugins" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">allow_external_plugins</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.AsrPipelineOptions.artifacts_path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">artifacts_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="pathlib.Path">Path</span></span><span class="p">,</span> <span class="n"><span title="str">str</span></span><span class="p">]]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.AsrPipelineOptions.asr_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">asr_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">asr_options</span><span class="p">:</span> <span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="docling.datamodel.pipeline_options_asr_model.InlineAsrOptions">InlineAsrOptions</span></span><span class="p">]</span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.asr_model_specs.WHISPER_TINY">WHISPER_TINY</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.AsrPipelineOptions.document_timeout" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">document_timeout</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="float">float</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.AsrPipelineOptions.enable_remote_services" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">enable_remote_services</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.AsrPipelineOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.BaseLayoutOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">BaseLayoutOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseOptions">BaseOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Base options for layout models.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;keep_empty_clusters&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseLayoutOptions.keep_empty_clusters&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseLayoutOptions.keep_empty_clusters">keep_empty_clusters</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;kind&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseLayoutOptions.kind&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseLayoutOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;skip_cell_assignment&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseLayoutOptions.skip_cell_assignment&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseLayoutOptions.skip_cell_assignment">skip_cell_assignment</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.BaseLayoutOptions.keep_empty_clusters" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">keep_empty_clusters</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">keep_empty_clusters</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.BaseLayoutOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.BaseLayoutOptions.skip_cell_assignment" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">skip_cell_assignment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">skip_cell_assignment</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.BaseOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">BaseOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><span title="pydantic.BaseModel">BaseModel</span></code></p>
|
||
|
||
|
||
|
||
<p>Base class for options.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;kind&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseOptions.kind&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.BaseOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.BaseTableStructureOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">BaseTableStructureOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseOptions">BaseOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Base options for table structure models.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;kind&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseTableStructureOptions.kind&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseTableStructureOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.BaseTableStructureOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.ConvertPipelineOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">ConvertPipelineOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PipelineOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PipelineOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PipelineOptions">PipelineOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Base convert pipeline options.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;accelerator_options&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ConvertPipelineOptions.accelerator_options&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.accelerator_options">accelerator_options</a></code></b>
|
||
(<code><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;allow_external_plugins&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ConvertPipelineOptions.allow_external_plugins&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.allow_external_plugins">allow_external_plugins</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;artifacts_path&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ConvertPipelineOptions.artifacts_path&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.artifacts_path">artifacts_path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="typing.Union">Union</span>[<span title="pathlib.Path">Path</span>, <span title="str">str</span>]]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;do_picture_classification&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_classification&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_classification">do_picture_classification</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;do_picture_description&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_description&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_description">do_picture_description</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;document_timeout&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ConvertPipelineOptions.document_timeout&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.document_timeout">document_timeout</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="float">float</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;enable_remote_services&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ConvertPipelineOptions.enable_remote_services&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.enable_remote_services">enable_remote_services</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;kind&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ConvertPipelineOptions.kind&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;picture_description_options&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ConvertPipelineOptions.picture_description_options&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions.picture_description_options">picture_description_options</a></code></b>
|
||
(<code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PictureDescriptionBaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionBaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ConvertPipelineOptions.accelerator_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">accelerator_options</span><span class="p">:</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ConvertPipelineOptions.allow_external_plugins" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">allow_external_plugins</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ConvertPipelineOptions.artifacts_path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">artifacts_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="pathlib.Path">Path</span></span><span class="p">,</span> <span class="n"><span title="str">str</span></span><span class="p">]]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_classification" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_classification</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_classification</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ConvertPipelineOptions.do_picture_description" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_description</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ConvertPipelineOptions.document_timeout" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">document_timeout</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="float">float</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ConvertPipelineOptions.enable_remote_services" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">enable_remote_services</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ConvertPipelineOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ConvertPipelineOptions.picture_description_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_description_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">picture_description_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PictureDescriptionBaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionBaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;smolvlm_picture_description&lt;/span&gt;
&lt;span class=&quot;doc doc-labels&quot;&gt;
&lt;small class=&quot;doc doc-label doc-label-module-attribute&quot;&gt;&lt;code&gt;module-attribute&lt;/code&gt;&lt;/small&gt;
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.smolvlm_picture_description&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.smolvlm_picture_description">smolvlm_picture_description</a></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.EasyOcrOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">EasyOcrOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for the EasyOCR engine.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.bitmap_area_threshold</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.bitmap_area_threshold">bitmap_area_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">confidence_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.confidence_threshold</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.confidence_threshold">confidence_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">download_enabled</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.download_enabled</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.download_enabled">download_enabled</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.force_full_page_ocr</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.force_full_page_ocr">force_full_page_ocr</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.kind</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.kind">kind</a></code></b>
|
||
(<code><span title="typing.Literal">Literal</span>['easyocr']</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.lang</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.lang">lang</a></code></b>
|
||
(<code><span title="typing.List">List</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_config</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.model_config</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.model_config">model_config</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_storage_directory</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.model_storage_directory</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.model_storage_directory">model_storage_directory</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">recog_network</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.recog_network</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.recog_network">recog_network</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">suppress_mps_warnings</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.suppress_mps_warnings</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.suppress_mps_warnings">suppress_mps_warnings</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">use_gpu</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.EasyOcrOptions.use_gpu</code>)" href="#docling.datamodel.pipeline_options.EasyOcrOptions.use_gpu">use_gpu</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="bool">bool</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.bitmap_area_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">bitmap_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.confidence_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">confidence_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">confidence_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.5</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.download_enabled" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">download_enabled</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">download_enabled</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">True</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.force_full_page_ocr" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">force_full_page_ocr</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="typing.Literal">Literal</span></span><span class="p">[</span><span class="s1">'easyocr'</span><span class="p">]</span> <span class="o">=</span> <span class="s1">'easyocr'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.lang" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">lang</span><span class="p">:</span> <span class="n"><span title="typing.List">List</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="p">[</span><span class="s1">'fr'</span><span class="p">,</span> <span class="s1">'de'</span><span class="p">,</span> <span class="s1">'es'</span><span class="p">,</span> <span class="s1">'en'</span><span class="p">]</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.model_config" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_config</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">model_config</span> <span class="o">=</span> <span class="n"><span title="pydantic.ConfigDict">ConfigDict</span></span><span class="p">(</span><span class="n"><span title="pydantic.ConfigDict(extra)">extra</span></span><span class="o">=</span><span class="s1">'forbid'</span><span class="p">,</span> <span class="n"><span title="pydantic.ConfigDict(protected_namespaces)">protected_namespaces</span></span><span class="o">=</span><span class="p">())</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.model_storage_directory" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_storage_directory</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">model_storage_directory</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.recog_network" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">recog_network</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">recog_network</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="s1">'standard'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.suppress_mps_warnings" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">suppress_mps_warnings</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">suppress_mps_warnings</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">True</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.EasyOcrOptions.use_gpu" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">use_gpu</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">use_gpu</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="bool">bool</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.LayoutOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">LayoutOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseLayoutOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseLayoutOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseLayoutOptions">BaseLayoutOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for layout processing.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">create_orphan_clusters</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.LayoutOptions.create_orphan_clusters</code>)" href="#docling.datamodel.pipeline_options.LayoutOptions.create_orphan_clusters">create_orphan_clusters</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">keep_empty_clusters</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.LayoutOptions.keep_empty_clusters</code>)" href="#docling.datamodel.pipeline_options.LayoutOptions.keep_empty_clusters">keep_empty_clusters</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.LayoutOptions.kind</code>)" href="#docling.datamodel.pipeline_options.LayoutOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_spec</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.LayoutOptions.model_spec</code>)" href="#docling.datamodel.pipeline_options.LayoutOptions.model_spec">model_spec</a></code></b>
|
||
(<code><span title="docling.datamodel.layout_model_specs.LayoutModelConfig">LayoutModelConfig</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">skip_cell_assignment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.LayoutOptions.skip_cell_assignment</code>)" href="#docling.datamodel.pipeline_options.LayoutOptions.skip_cell_assignment">skip_cell_assignment</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.LayoutOptions.create_orphan_clusters" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">create_orphan_clusters</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">create_orphan_clusters</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">True</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.LayoutOptions.keep_empty_clusters" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">keep_empty_clusters</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">keep_empty_clusters</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.LayoutOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span> <span class="o">=</span> <span class="s1">'docling_layout_default'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.LayoutOptions.model_spec" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_spec</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">model_spec</span><span class="p">:</span> <span class="n"><span title="docling.datamodel.layout_model_specs.LayoutModelConfig">LayoutModelConfig</span></span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.layout_model_specs.DOCLING_LAYOUT_HERON">DOCLING_LAYOUT_HERON</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.LayoutOptions.skip_cell_assignment" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">skip_cell_assignment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">skip_cell_assignment</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.OcrAutoOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">OcrAutoOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for picking the OCR engine automatically.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrAutoOptions.bitmap_area_threshold</code>)" href="#docling.datamodel.pipeline_options.OcrAutoOptions.bitmap_area_threshold">bitmap_area_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrAutoOptions.force_full_page_ocr</code>)" href="#docling.datamodel.pipeline_options.OcrAutoOptions.force_full_page_ocr">force_full_page_ocr</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrAutoOptions.kind</code>)" href="#docling.datamodel.pipeline_options.OcrAutoOptions.kind">kind</a></code></b>
|
||
(<code><span title="typing.Literal">Literal</span>['auto']</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrAutoOptions.lang</code>)" href="#docling.datamodel.pipeline_options.OcrAutoOptions.lang">lang</a></code></b>
|
||
(<code><span title="typing.List">List</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrAutoOptions.bitmap_area_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">bitmap_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrAutoOptions.force_full_page_ocr" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">force_full_page_ocr</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrAutoOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="typing.Literal">Literal</span></span><span class="p">[</span><span class="s1">'auto'</span><span class="p">]</span> <span class="o">=</span> <span class="s1">'auto'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrAutoOptions.lang" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">lang</span><span class="p">:</span> <span class="n"><span title="typing.List">List</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="p">[]</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.OcrEngine" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">OcrEngine</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><span title="str">str</span></code>, <code><span title="enum.Enum">Enum</span></code></p>
|
||
|
||
|
||
|
||
<p>Enum of valid OCR engines.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">AUTO</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrEngine.AUTO</code>)" href="#docling.datamodel.pipeline_options.OcrEngine.AUTO">AUTO</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">EASYOCR</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrEngine.EASYOCR</code>)" href="#docling.datamodel.pipeline_options.OcrEngine.EASYOCR">EASYOCR</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">OCRMAC</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrEngine.OCRMAC</code>)" href="#docling.datamodel.pipeline_options.OcrEngine.OCRMAC">OCRMAC</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">RAPIDOCR</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrEngine.RAPIDOCR</code>)" href="#docling.datamodel.pipeline_options.OcrEngine.RAPIDOCR">RAPIDOCR</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">TESSERACT</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrEngine.TESSERACT</code>)" href="#docling.datamodel.pipeline_options.OcrEngine.TESSERACT">TESSERACT</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">TESSERACT_CLI</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrEngine.TESSERACT_CLI</code>)" href="#docling.datamodel.pipeline_options.OcrEngine.TESSERACT_CLI">TESSERACT_CLI</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrEngine.AUTO" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">AUTO</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">AUTO</span> <span class="o">=</span> <span class="s1">'auto'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrEngine.EASYOCR" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">EASYOCR</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">EASYOCR</span> <span class="o">=</span> <span class="s1">'easyocr'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrEngine.OCRMAC" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">OCRMAC</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">OCRMAC</span> <span class="o">=</span> <span class="s1">'ocrmac'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrEngine.RAPIDOCR" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">RAPIDOCR</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">RAPIDOCR</span> <span class="o">=</span> <span class="s1">'rapidocr'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrEngine.TESSERACT" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">TESSERACT</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">TESSERACT</span> <span class="o">=</span> <span class="s1">'tesseract'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrEngine.TESSERACT_CLI" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">TESSERACT_CLI</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">TESSERACT_CLI</span> <span class="o">=</span> <span class="s1">'tesseract_cli'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.OcrMacOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">OcrMacOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for the Mac OCR engine.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrMacOptions.bitmap_area_threshold</code>)" href="#docling.datamodel.pipeline_options.OcrMacOptions.bitmap_area_threshold">bitmap_area_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrMacOptions.force_full_page_ocr</code>)" href="#docling.datamodel.pipeline_options.OcrMacOptions.force_full_page_ocr">force_full_page_ocr</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">framework</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrMacOptions.framework</code>)" href="#docling.datamodel.pipeline_options.OcrMacOptions.framework">framework</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrMacOptions.kind</code>)" href="#docling.datamodel.pipeline_options.OcrMacOptions.kind">kind</a></code></b>
|
||
(<code><span title="typing.Literal">Literal</span>['ocrmac']</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrMacOptions.lang</code>)" href="#docling.datamodel.pipeline_options.OcrMacOptions.lang">lang</a></code></b>
|
||
(<code><span title="typing.List">List</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_config</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrMacOptions.model_config</code>)" href="#docling.datamodel.pipeline_options.OcrMacOptions.model_config">model_config</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">recognition</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrMacOptions.recognition</code>)" href="#docling.datamodel.pipeline_options.OcrMacOptions.recognition">recognition</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrMacOptions.bitmap_area_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">bitmap_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrMacOptions.force_full_page_ocr" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">force_full_page_ocr</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrMacOptions.framework" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">framework</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">framework</span><span class="p">:</span> <span class="n"><span title="str">str</span></span> <span class="o">=</span> <span class="s1">'vision'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrMacOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="typing.Literal">Literal</span></span><span class="p">[</span><span class="s1">'ocrmac'</span><span class="p">]</span> <span class="o">=</span> <span class="s1">'ocrmac'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrMacOptions.lang" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">lang</span><span class="p">:</span> <span class="n"><span title="typing.List">List</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="p">[</span><span class="s1">'fr-FR'</span><span class="p">,</span> <span class="s1">'de-DE'</span><span class="p">,</span> <span class="s1">'es-ES'</span><span class="p">,</span> <span class="s1">'en-US'</span><span class="p">]</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrMacOptions.model_config" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_config</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">model_config</span> <span class="o">=</span> <span class="n"><span title="pydantic.ConfigDict">ConfigDict</span></span><span class="p">(</span><span class="n"><span title="pydantic.ConfigDict(extra)">extra</span></span><span class="o">=</span><span class="s1">'forbid'</span><span class="p">)</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrMacOptions.recognition" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">recognition</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">recognition</span><span class="p">:</span> <span class="n"><span title="str">str</span></span> <span class="o">=</span> <span class="s1">'accurate'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.OcrOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">OcrOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">BaseOptions</span> (<code>docling.datamodel.pipeline_options.BaseOptions</code>)" href="#docling.datamodel.pipeline_options.BaseOptions">BaseOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>OCR options.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrOptions.bitmap_area_threshold</code>)" href="#docling.datamodel.pipeline_options.OcrOptions.bitmap_area_threshold">bitmap_area_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrOptions.force_full_page_ocr</code>)" href="#docling.datamodel.pipeline_options.OcrOptions.force_full_page_ocr">force_full_page_ocr</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrOptions.kind</code>)" href="#docling.datamodel.pipeline_options.OcrOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.OcrOptions.lang</code>)" href="#docling.datamodel.pipeline_options.OcrOptions.lang">lang</a></code></b>
|
||
(<code><span title="typing.List">List</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrOptions.bitmap_area_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">bitmap_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrOptions.force_full_page_ocr" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">force_full_page_ocr</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.OcrOptions.lang" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">lang</span><span class="p">:</span> <span class="n"><span title="typing.List">List</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PaginatedPipelineOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">ConvertPipelineOptions</span> (<code>docling.datamodel.pipeline_options.ConvertPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.ConvertPipelineOptions">ConvertPipelineOptions</a></code></p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.accelerator_options</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.accelerator_options">accelerator_options</a></code></b>
|
||
(<code><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.allow_external_plugins</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.allow_external_plugins">allow_external_plugins</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.artifacts_path</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.artifacts_path">artifacts_path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="typing.Union">Union</span>[<span title="pathlib.Path">Path</span>, <span title="str">str</span>]]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_classification</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_classification</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_classification">do_picture_classification</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_description</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_description">do_picture_description</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.document_timeout</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.document_timeout">document_timeout</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="float">float</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.enable_remote_services</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.enable_remote_services">enable_remote_services</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_page_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_page_images</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_page_images">generate_page_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_picture_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_picture_images</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_picture_images">generate_picture_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">images_scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.images_scale</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.images_scale">images_scale</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.kind</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_description_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions.picture_description_options</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions.picture_description_options">picture_description_options</a></code></b>
|
||
(<code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionBaseOptions</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionBaseOptions</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.accelerator_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">accelerator_options</span><span class="p">:</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.allow_external_plugins" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">allow_external_plugins</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.artifacts_path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">artifacts_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="pathlib.Path">Path</span></span><span class="p">,</span> <span class="n"><span title="str">str</span></span><span class="p">]]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_classification" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_classification</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_classification</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.do_picture_description" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_description</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.document_timeout" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">document_timeout</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="float">float</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.enable_remote_services" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">enable_remote_services</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_page_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_page_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_page_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.generate_picture_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_picture_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_picture_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.images_scale" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">images_scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">images_scale</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">1.0</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PaginatedPipelineOptions.picture_description_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_description_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">picture_description_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionBaseOptions</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionBaseOptions</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">smolvlm_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-module-attribute"><code>module-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.smolvlm_picture_description</code>)" href="#docling.datamodel.pipeline_options.smolvlm_picture_description">smolvlm_picture_description</a></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.PdfBackend" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PdfBackend</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><span title="str">str</span></code>, <code><span title="enum.Enum">Enum</span></code></p>
|
||
|
||
|
||
|
||
<p>Enum of valid PDF backends.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">DLPARSE_V1</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V1</code>)" href="#docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V1">DLPARSE_V1</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">DLPARSE_V2</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V2</code>)" href="#docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V2">DLPARSE_V2</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">DLPARSE_V4</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V4</code>)" href="#docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V4">DLPARSE_V4</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">PYPDFIUM2</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfBackend.PYPDFIUM2</code>)" href="#docling.datamodel.pipeline_options.PdfBackend.PYPDFIUM2">PYPDFIUM2</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V1" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">DLPARSE_V1</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">DLPARSE_V1</span> <span class="o">=</span> <span class="s1">'dlparse_v1'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V2" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">DLPARSE_V2</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">DLPARSE_V2</span> <span class="o">=</span> <span class="s1">'dlparse_v2'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfBackend.DLPARSE_V4" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">DLPARSE_V4</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">DLPARSE_V4</span> <span class="o">=</span> <span class="s1">'dlparse_v4'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfBackend.PYPDFIUM2" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">PYPDFIUM2</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">PYPDFIUM2</span> <span class="o">=</span> <span class="s1">'pypdfium2'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.PdfPipelineOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PdfPipelineOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
              Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt;            &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PaginatedPipelineOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PaginatedPipelineOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions">PaginatedPipelineOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for the PDF pipeline.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.accelerator_options</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.accelerator_options">accelerator_options</a></code></b>
|
||
(<code><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.allow_external_plugins</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.allow_external_plugins">allow_external_plugins</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.artifacts_path</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.artifacts_path">artifacts_path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="typing.Union">Union</span>[<span title="pathlib.Path">Path</span>, <span title="str">str</span>]]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">batch_polling_interval_seconds</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.batch_polling_interval_seconds</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.batch_polling_interval_seconds">batch_polling_interval_seconds</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_code_enrichment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.do_code_enrichment</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_code_enrichment">do_code_enrichment</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_formula_enrichment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.do_formula_enrichment</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_formula_enrichment">do_formula_enrichment</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.do_ocr</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_ocr">do_ocr</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_classification</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_classification</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_classification">do_picture_classification</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_description</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_description">do_picture_description</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_table_structure</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.do_table_structure</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.do_table_structure">do_table_structure</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.document_timeout</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.document_timeout">document_timeout</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="float">float</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.enable_remote_services</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.enable_remote_services">enable_remote_services</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_backend_text</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.force_backend_text</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.force_backend_text">force_backend_text</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_page_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.generate_page_images</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_page_images">generate_page_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_parsed_pages</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.generate_parsed_pages</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_parsed_pages">generate_parsed_pages</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_picture_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.generate_picture_images</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_picture_images">generate_picture_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_table_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.generate_table_images</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.generate_table_images">generate_table_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">images_scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.images_scale</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.images_scale">images_scale</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.kind</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">layout_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.layout_batch_size</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.layout_batch_size">layout_batch_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">layout_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.layout_options</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.layout_options">layout_options</a></code></b>
|
||
                  (<code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt;            &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseLayoutOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseLayoutOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseLayoutOptions">BaseLayoutOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ocr_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_batch_size</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_batch_size">ocr_batch_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ocr_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_options</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_options">ocr_options</a></code></b>
|
||
                  (<code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt;            &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_description_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.picture_description_options</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.picture_description_options">picture_description_options</a></code></b>
|
||
                  (<code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt;            &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PictureDescriptionBaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionBaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">queue_max_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.queue_max_size</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.queue_max_size">queue_max_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">table_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions.table_batch_size</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.table_batch_size">table_batch_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;table_structure_options&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PdfPipelineOptions.table_structure_options&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions.table_structure_options">table_structure_options</a></code></b>
|
||
(<code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseTableStructureOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseTableStructureOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseTableStructureOptions">BaseTableStructureOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.accelerator_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">accelerator_options</span><span class="p">:</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.allow_external_plugins" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">allow_external_plugins</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.artifacts_path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">artifacts_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="pathlib.Path">Path</span></span><span class="p">,</span> <span class="n"><span title="str">str</span></span><span class="p">]]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.batch_polling_interval_seconds" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">batch_polling_interval_seconds</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">batch_polling_interval_seconds</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.5</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.do_code_enrichment" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_code_enrichment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_code_enrichment</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.do_formula_enrichment" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_formula_enrichment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_formula_enrichment</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.do_ocr" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_ocr</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">True</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_classification" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_classification</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_classification</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.do_picture_description" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_description</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.do_table_structure" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_table_structure</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_table_structure</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">True</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.document_timeout" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">document_timeout</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="float">float</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.enable_remote_services" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">enable_remote_services</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.force_backend_text" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_backend_text</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">force_backend_text</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.generate_page_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_page_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_page_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.generate_parsed_pages" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_parsed_pages</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_parsed_pages</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.generate_picture_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_picture_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_picture_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.generate_table_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_table_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_table_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="n"><span title="pydantic.Field">Field</span></span><span class="p">(</span><span class="n"><span title="pydantic.Field(default)">default</span></span><span class="o">=</span><span class="kc">False</span><span class="p">,</span> <span class="n"><span title="pydantic.Field(deprecated)">deprecated</span></span><span class="o">=</span><span class="s1">'Field `generate_table_images` is deprecated. To obtain table images, set `PdfPipelineOptions.generate_page_images = True` before conversion and then use the `TableItem.get_image` function.'</span><span class="p">)</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.images_scale" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">images_scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">images_scale</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">1.0</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.layout_batch_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">layout_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">layout_batch_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">4</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.layout_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">layout_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">layout_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseLayoutOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseLayoutOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseLayoutOptions">BaseLayoutOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;LayoutOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.LayoutOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.LayoutOptions">LayoutOptions</a></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_batch_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ocr_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">ocr_batch_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">4</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.ocr_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ocr_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">ocr_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrAutoOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrAutoOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrAutoOptions">OcrAutoOptions</a></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.picture_description_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_description_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">picture_description_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PictureDescriptionBaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionBaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;smolvlm_picture_description&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-module-attribute&quot;&gt;&lt;code&gt;module-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.smolvlm_picture_description&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.smolvlm_picture_description">smolvlm_picture_description</a></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.queue_max_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">queue_max_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">queue_max_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">100</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.table_batch_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">table_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">table_batch_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">4</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PdfPipelineOptions.table_structure_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">table_structure_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">table_structure_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseTableStructureOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseTableStructureOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseTableStructureOptions">BaseTableStructureOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;TableStructureOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TableStructureOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TableStructureOptions">TableStructureOptions</a></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionApiOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PictureDescriptionBaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionBaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></code></p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;batch_size&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionApiOptions.batch_size&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.batch_size">batch_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">concurrency</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.concurrency</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.concurrency">concurrency</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">headers</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.headers</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.headers">headers</a></code></b>
|
||
(<code><span title="typing.Dict">Dict</span>[<span title="str">str</span>, <span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.kind</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.kind">kind</a></code></b>
|
||
(<code><span title="typing.Literal">Literal</span>['api']</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">params</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.params</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.params">params</a></code></b>
|
||
(<code><span title="typing.Dict">Dict</span>[<span title="str">str</span>, <span title="typing.Any">Any</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.picture_area_threshold</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.picture_area_threshold">picture_area_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">prompt</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.prompt</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.prompt">prompt</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">provenance</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.provenance</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.provenance">provenance</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.scale</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.scale">scale</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.timeout</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.timeout">timeout</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">url</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionApiOptions.url</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionApiOptions.url">url</a></code></b>
|
||
(<code><span title="pydantic.AnyUrl">AnyUrl</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.batch_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">batch_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">8</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.concurrency" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">concurrency</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">concurrency</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">1</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.headers" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">headers</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">headers</span><span class="p">:</span> <span class="n"><span title="typing.Dict">Dict</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">,</span> <span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="p">{}</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="typing.Literal">Literal</span></span><span class="p">[</span><span class="s1">'api'</span><span class="p">]</span> <span class="o">=</span> <span class="s1">'api'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.params" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">params</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">params</span><span class="p">:</span> <span class="n"><span title="typing.Dict">Dict</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">,</span> <span class="n"><span title="typing.Any">Any</span></span><span class="p">]</span> <span class="o">=</span> <span class="p">{}</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.picture_area_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">picture_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.prompt" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">prompt</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">prompt</span><span class="p">:</span> <span class="n"><span title="str">str</span></span> <span class="o">=</span> <span class="s1">'Describe this image in a few sentences.'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.provenance" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">provenance</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">provenance</span><span class="p">:</span> <span class="n"><span title="str">str</span></span> <span class="o">=</span> <span class="s1">''</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.scale" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">scale</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mi">2</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.timeout" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">timeout</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mi">20</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionApiOptions.url" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">url</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">url</span><span class="p">:</span> <span class="n"><span title="pydantic.AnyUrl">AnyUrl</span></span> <span class="o">=</span> <span class="n"><span title="pydantic.AnyUrl">AnyUrl</span></span><span class="p">(</span><span class="s1">'http://localhost:8000/v1/chat/completions'</span><span class="p">)</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.PictureDescriptionBaseOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionBaseOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseOptions">BaseOptions</a></code></p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.batch_size</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.batch_size">batch_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.kind</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.picture_area_threshold</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.picture_area_threshold">picture_area_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.scale</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.scale">scale</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.batch_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">batch_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">8</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.picture_area_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">picture_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionBaseOptions.scale" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">scale</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mi">2</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionVlmOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PictureDescriptionBaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionBaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></code></p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.batch_size</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.batch_size">batch_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generation_config</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.generation_config</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.generation_config">generation_config</a></code></b>
|
||
(<code><span title="typing.Dict">Dict</span>[<span title="str">str</span>, <span title="typing.Any">Any</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.kind</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.kind">kind</a></code></b>
|
||
(<code><span title="typing.Literal">Literal</span>['vlm']</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.picture_area_threshold</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.picture_area_threshold">picture_area_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;prompt&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.prompt&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.prompt">prompt</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;repo_cache_folder&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-property&quot;&gt;&lt;code&gt;property&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_cache_folder&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_cache_folder">repo_cache_folder</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;repo_id&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_id&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_id">repo_id</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;scale&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.scale&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.scale">scale</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.batch_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">batch_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">8</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.generation_config" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generation_config</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generation_config</span><span class="p">:</span> <span class="n"><span title="typing.Dict">Dict</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">,</span> <span class="n"><span title="typing.Any">Any</span></span><span class="p">]</span> <span class="o">=</span> <span class="n"><span title="dict">dict</span></span><span class="p">(</span><span class="n"><span title="dict(max_new_tokens)">max_new_tokens</span></span><span class="o">=</span><span class="mi">200</span><span class="p">,</span> <span class="n"><span title="dict(do_sample)">do_sample</span></span><span class="o">=</span><span class="kc">False</span><span class="p">)</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="typing.Literal">Literal</span></span><span class="p">[</span><span class="s1">'vlm'</span><span class="p">]</span> <span class="o">=</span> <span class="s1">'vlm'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.picture_area_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">picture_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.prompt" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">prompt</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">prompt</span><span class="p">:</span> <span class="n"><span title="str">str</span></span> <span class="o">=</span> <span class="s1">'Describe this image in a few sentences.'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_cache_folder" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">repo_cache_folder</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-property"><code>property</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">repo_cache_folder</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.repo_id" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">repo_id</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">repo_id</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PictureDescriptionVlmOptions.scale" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">scale</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mi">2</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.PipelineOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PipelineOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseOptions">BaseOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Base pipeline options.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;accelerator_options&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PipelineOptions.accelerator_options&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PipelineOptions.accelerator_options">accelerator_options</a></code></b>
|
||
(<code><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;allow_external_plugins&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PipelineOptions.allow_external_plugins&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PipelineOptions.allow_external_plugins">allow_external_plugins</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;artifacts_path&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PipelineOptions.artifacts_path&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PipelineOptions.artifacts_path">artifacts_path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="typing.Union">Union</span>[<span title="pathlib.Path">Path</span>, <span title="str">str</span>]]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;document_timeout&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PipelineOptions.document_timeout&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PipelineOptions.document_timeout">document_timeout</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="float">float</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;enable_remote_services&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PipelineOptions.enable_remote_services&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PipelineOptions.enable_remote_services">enable_remote_services</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;kind&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PipelineOptions.kind&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PipelineOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PipelineOptions.accelerator_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">accelerator_options</span><span class="p">:</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PipelineOptions.allow_external_plugins" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">allow_external_plugins</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PipelineOptions.artifacts_path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">artifacts_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="pathlib.Path">Path</span></span><span class="p">,</span> <span class="n"><span title="str">str</span></span><span class="p">]]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PipelineOptions.document_timeout" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">document_timeout</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="float">float</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PipelineOptions.enable_remote_services" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">enable_remote_services</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.PipelineOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.ProcessingPipeline" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">ProcessingPipeline</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><span title="str">str</span></code>, <code><span title="enum.Enum">Enum</span></code></p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;ASR&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ProcessingPipeline.ASR&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ProcessingPipeline.ASR">ASR</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;LEGACY&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ProcessingPipeline.LEGACY&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ProcessingPipeline.LEGACY">LEGACY</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;STANDARD&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ProcessingPipeline.STANDARD&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ProcessingPipeline.STANDARD">STANDARD</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;VLM&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ProcessingPipeline.VLM&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ProcessingPipeline.VLM">VLM</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ProcessingPipeline.ASR" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ASR</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">ASR</span> <span class="o">=</span> <span class="s1">'asr'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ProcessingPipeline.LEGACY" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">LEGACY</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">LEGACY</span> <span class="o">=</span> <span class="s1">'legacy'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ProcessingPipeline.STANDARD" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">STANDARD</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">STANDARD</span> <span class="o">=</span> <span class="s1">'standard'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ProcessingPipeline.VLM" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">VLM</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">VLM</span> <span class="o">=</span> <span class="s1">'vlm'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.RapidOcrOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">RapidOcrOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for the RapidOCR engine.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;backend&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.backend&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.backend">backend</a></code></b>
|
||
(<code><span title="typing.Literal">Literal</span>['onnxruntime', 'openvino', 'paddle', 'torch']</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<!-- Summary entry for `bitmap_area_threshold`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;bitmap_area_threshold&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.bitmap_area_threshold&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.bitmap_area_threshold">bitmap_area_threshold</a></code></b>
  (<code><span title="float">float</span></code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `cls_model_path`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;cls_model_path&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.cls_model_path&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.cls_model_path">cls_model_path</a></code></b>
  (<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `det_model_path`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;det_model_path&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.det_model_path&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.det_model_path">det_model_path</a></code></b>
  (<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `font_path`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;font_path&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.font_path&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.font_path">font_path</a></code></b>
  (<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `force_full_page_ocr`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;force_full_page_ocr&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.force_full_page_ocr&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.force_full_page_ocr">force_full_page_ocr</a></code></b>
  (<code><span title="bool">bool</span></code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `kind`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;kind&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.kind&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.kind">kind</a></code></b>
  (<code><span title="typing.Literal">Literal</span>['rapidocr']</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `lang`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;lang&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.lang&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.lang">lang</a></code></b>
  (<code><span title="typing.List">List</span>[<span title="str">str</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `model_config` (no type shown); the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;model_config&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.model_config&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.model_config">model_config</a></code></b>
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `print_verbose`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;print_verbose&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.print_verbose&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.print_verbose">print_verbose</a></code></b>
  (<code><span title="bool">bool</span></code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `rapidocr_params`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;rapidocr_params&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.rapidocr_params&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.rapidocr_params">rapidocr_params</a></code></b>
  (<code><span title="typing.Dict">Dict</span>[<span title="str">str</span>, <span title="typing.Any">Any</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `rec_font_path`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;rec_font_path&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.rec_font_path&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.rec_font_path">rec_font_path</a></code></b>
  (<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `rec_keys_path`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;rec_keys_path&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.rec_keys_path&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.rec_keys_path">rec_keys_path</a></code></b>
  (<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `rec_model_path`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;rec_model_path&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.rec_model_path&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.rec_model_path">rec_model_path</a></code></b>
  (<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `text_score`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;text_score&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.text_score&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.text_score">text_score</a></code></b>
  (<code><span title="float">float</span></code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `use_cls`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;use_cls&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.use_cls&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.use_cls">use_cls</a></code></b>
  (<code><span title="typing.Optional">Optional</span>[<span title="bool">bool</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `use_det`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;use_det&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.use_det&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.use_det">use_det</a></code></b>
  (<code><span title="typing.Optional">Optional</span>[<span title="bool">bool</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
<!-- Summary entry for `use_rec`; the link jumps to its detail heading on this page. Title value is entity-escaped. -->
<li class="doc-section-item field-body">
  <b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;use_rec&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.RapidOcrOptions.use_rec&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.RapidOcrOptions.use_rec">use_rec</a></code></b>
  (<code><span title="typing.Optional">Optional</span>[<span title="bool">bool</span>]</code>)
  –
  <div class="doc-md-description"></div>
</li>
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<!-- Detail section for `backend`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.backend" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">backend</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">backend</span><span class="p">:</span> <span class="n"><span title="typing.Literal">Literal</span></span><span class="p">[</span><span class="s1">'onnxruntime'</span><span class="p">,</span> <span class="s1">'openvino'</span><span class="p">,</span> <span class="s1">'paddle'</span><span class="p">,</span> <span class="s1">'torch'</span><span class="p">]</span> <span class="o">=</span> <span class="s1">'onnxruntime'</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `bitmap_area_threshold`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.bitmap_area_threshold" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">bitmap_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `cls_model_path`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.cls_model_path" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">cls_model_path</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">cls_model_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `det_model_path`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.det_model_path" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">det_model_path</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">det_model_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `font_path`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.font_path" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">font_path</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">font_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `force_full_page_ocr`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.force_full_page_ocr" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">force_full_page_ocr</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `kind`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.kind" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="typing.Literal">Literal</span></span><span class="p">[</span><span class="s1">'rapidocr'</span><span class="p">]</span> <span class="o">=</span> <span class="s1">'rapidocr'</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `lang`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.lang" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">lang</span><span class="p">:</span> <span class="n"><span title="typing.List">List</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="p">[</span><span class="s1">'english'</span><span class="p">,</span> <span class="s1">'chinese'</span><span class="p">]</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `model_config`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.model_config" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_config</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">model_config</span> <span class="o">=</span> <span class="n"><span title="pydantic.ConfigDict">ConfigDict</span></span><span class="p">(</span><span class="n"><span title="pydantic.ConfigDict(extra)">extra</span></span><span class="o">=</span><span class="s1">'forbid'</span><span class="p">)</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `print_verbose`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.print_verbose" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">print_verbose</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">print_verbose</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `rapidocr_params`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.rapidocr_params" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">rapidocr_params</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">rapidocr_params</span><span class="p">:</span> <span class="n"><span title="typing.Dict">Dict</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">,</span> <span class="n"><span title="typing.Any">Any</span></span><span class="p">]</span> <span class="o">=</span> <span class="n"><span title="pydantic.Field">Field</span></span><span class="p">(</span><span class="n"><span title="pydantic.Field(default_factory)">default_factory</span></span><span class="o">=</span><span class="n"><span title="dict">dict</span></span><span class="p">)</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `rec_font_path`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.rec_font_path" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">rec_font_path</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">rec_font_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `rec_keys_path`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.rec_keys_path" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">rec_keys_path</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">rec_keys_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `rec_model_path`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.rec_model_path" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">rec_model_path</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">rec_model_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `text_score`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.text_score" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">text_score</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">text_score</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.5</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `use_cls`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.use_cls" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">use_cls</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">use_cls</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="bool">bool</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<!-- Detail section for `use_det`: anchor heading plus highlighted signature. The closing code/pre tags stay at column 0 so no extra whitespace enters the preformatted text. -->
<div class="doc doc-object doc-attribute">
  <h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.use_det" class="doc doc-heading">
    <code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">use_det</span>
    <span class="doc doc-labels">
      <small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
      <small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
    </span>
  </h4>
  <div class="doc-signature highlight"><pre><span></span><code><span class="n">use_det</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="bool">bool</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
</code></pre></div>
  <div class="doc doc-contents "></div>
</div>
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.RapidOcrOptions.use_rec" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">use_rec</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">use_rec</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="bool">bool</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.TableFormerMode" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TableFormerMode</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><span title="str">str</span></code>, <code><span title="enum.Enum">Enum</span></code></p>
|
||
|
||
|
||
|
||
<p>Modes for the TableFormer model.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;ACCURATE&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TableFormerMode.ACCURATE&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TableFormerMode.ACCURATE">ACCURATE</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;FAST&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TableFormerMode.FAST&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TableFormerMode.FAST">FAST</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TableFormerMode.ACCURATE" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ACCURATE</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">ACCURATE</span> <span class="o">=</span> <span class="s1">'accurate'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TableFormerMode.FAST" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">FAST</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">FAST</span> <span class="o">=</span> <span class="s1">'fast'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.TableStructureOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TableStructureOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseTableStructureOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseTableStructureOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseTableStructureOptions">BaseTableStructureOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for the table structure.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;do_cell_matching&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TableStructureOptions.do_cell_matching&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TableStructureOptions.do_cell_matching">do_cell_matching</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;kind&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TableStructureOptions.kind&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TableStructureOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;mode&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TableStructureOptions.mode&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TableStructureOptions.mode">mode</a></code></b>
|
||
(<code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;TableFormerMode&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TableFormerMode&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TableFormerMode">TableFormerMode</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TableStructureOptions.do_cell_matching" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_cell_matching</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_cell_matching</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">True</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TableStructureOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span> <span class="o">=</span> <span class="s1">'docling_tableformer'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TableStructureOptions.mode" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">mode</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">mode</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TableFormerMode</span> (<code>docling.datamodel.pipeline_options.TableFormerMode</code>)" href="#docling.datamodel.pipeline_options.TableFormerMode">TableFormerMode</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ACCURATE</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.TableFormerMode.ACCURATE</code>)" href="#docling.datamodel.pipeline_options.TableFormerMode.ACCURATE">ACCURATE</a></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.TesseractCliOcrOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TesseractCliOcrOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for the TesseractCli engine.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;bitmap_area_threshold&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractCliOcrOptions.bitmap_area_threshold&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.bitmap_area_threshold">bitmap_area_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;force_full_page_ocr&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractCliOcrOptions.force_full_page_ocr&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.force_full_page_ocr">force_full_page_ocr</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;kind&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractCliOcrOptions.kind&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.kind">kind</a></code></b>
|
||
(<code><span title="typing.Literal">Literal</span>['tesseract']</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;lang&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractCliOcrOptions.lang&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.lang">lang</a></code></b>
|
||
(<code><span title="typing.List">List</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;model_config&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractCliOcrOptions.model_config&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.model_config">model_config</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;path&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractCliOcrOptions.path&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.path">path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;psm&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractCliOcrOptions.psm&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.psm">psm</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="int">int</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;tesseract_cmd&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractCliOcrOptions.tesseract_cmd&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractCliOcrOptions.tesseract_cmd">tesseract_cmd</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractCliOcrOptions.bitmap_area_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">bitmap_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractCliOcrOptions.force_full_page_ocr" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">force_full_page_ocr</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractCliOcrOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="typing.Literal">Literal</span></span><span class="p">[</span><span class="s1">'tesseract'</span><span class="p">]</span> <span class="o">=</span> <span class="s1">'tesseract'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractCliOcrOptions.lang" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">lang</span><span class="p">:</span> <span class="n"><span title="typing.List">List</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="p">[</span><span class="s1">'fra'</span><span class="p">,</span> <span class="s1">'deu'</span><span class="p">,</span> <span class="s1">'spa'</span><span class="p">,</span> <span class="s1">'eng'</span><span class="p">]</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractCliOcrOptions.model_config" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_config</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">model_config</span> <span class="o">=</span> <span class="n"><span title="pydantic.ConfigDict">ConfigDict</span></span><span class="p">(</span><span class="n"><span title="pydantic.ConfigDict(extra)">extra</span></span><span class="o">=</span><span class="s1">'forbid'</span><span class="p">)</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractCliOcrOptions.path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractCliOcrOptions.psm" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">psm</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">psm</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="int">int</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractCliOcrOptions.tesseract_cmd" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">tesseract_cmd</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">tesseract_cmd</span><span class="p">:</span> <span class="n"><span title="str">str</span></span> <span class="o">=</span> <span class="s1">'tesseract'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.TesseractOcrOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TesseractOcrOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for the Tesseract engine.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;bitmap_area_threshold&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractOcrOptions.bitmap_area_threshold&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractOcrOptions.bitmap_area_threshold">bitmap_area_threshold</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;force_full_page_ocr&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractOcrOptions.force_full_page_ocr&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractOcrOptions.force_full_page_ocr">force_full_page_ocr</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;kind&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractOcrOptions.kind&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractOcrOptions.kind">kind</a></code></b>
|
||
(<code><span title="typing.Literal">Literal</span>['tesserocr']</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;lang&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt; &lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt; &lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt; &lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.TesseractOcrOptions.lang&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.TesseractOcrOptions.lang">lang</a></code></b>
|
||
(<code><span title="typing.List">List</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_config</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.TesseractOcrOptions.model_config</code>)" href="#docling.datamodel.pipeline_options.TesseractOcrOptions.model_config">model_config</a></code></b>
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.TesseractOcrOptions.path</code>)" href="#docling.datamodel.pipeline_options.TesseractOcrOptions.path">path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="str">str</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">psm</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.TesseractOcrOptions.psm</code>)" href="#docling.datamodel.pipeline_options.TesseractOcrOptions.psm">psm</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="int">int</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractOcrOptions.bitmap_area_threshold" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">bitmap_area_threshold</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">bitmap_area_threshold</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.05</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractOcrOptions.force_full_page_ocr" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_full_page_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">force_full_page_ocr</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractOcrOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="typing.Literal">Literal</span></span><span class="p">[</span><span class="s1">'tesserocr'</span><span class="p">]</span> <span class="o">=</span> <span class="s1">'tesserocr'</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractOcrOptions.lang" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">lang</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">lang</span><span class="p">:</span> <span class="n"><span title="typing.List">List</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="p">[</span><span class="s1">'fra'</span><span class="p">,</span> <span class="s1">'deu'</span><span class="p">,</span> <span class="s1">'spa'</span><span class="p">,</span> <span class="s1">'eng'</span><span class="p">]</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractOcrOptions.model_config" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">model_config</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">model_config</span> <span class="o">=</span> <span class="n"><span title="pydantic.ConfigDict">ConfigDict</span></span><span class="p">(</span><span class="n"><span title="pydantic.ConfigDict(extra)">extra</span></span><span class="o">=</span><span class="s1">'forbid'</span><span class="p">)</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractOcrOptions.path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="str">str</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.TesseractOcrOptions.psm" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">psm</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">psm</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="int">int</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">ThreadedPdfPipelineOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PdfPipelineOptions</span> (<code>docling.datamodel.pipeline_options.PdfPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.PdfPipelineOptions">PdfPipelineOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Pipeline options for the threaded PDF pipeline with batching and backpressure control</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.accelerator_options</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.accelerator_options">accelerator_options</a></code></b>
|
||
(<code><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.allow_external_plugins</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.allow_external_plugins">allow_external_plugins</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.artifacts_path</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.artifacts_path">artifacts_path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="typing.Union">Union</span>[<span title="pathlib.Path">Path</span>, <span title="str">str</span>]]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">batch_polling_interval_seconds</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.batch_polling_interval_seconds</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.batch_polling_interval_seconds">batch_polling_interval_seconds</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_code_enrichment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_code_enrichment</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_code_enrichment">do_code_enrichment</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_formula_enrichment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_formula_enrichment</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_formula_enrichment">do_formula_enrichment</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_ocr</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_ocr">do_ocr</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_classification</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_classification</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_classification">do_picture_classification</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_description</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_description">do_picture_description</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_table_structure</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_table_structure</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_table_structure">do_table_structure</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.document_timeout</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.document_timeout">document_timeout</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="float">float</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.enable_remote_services</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.enable_remote_services">enable_remote_services</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_backend_text</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.force_backend_text</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.force_backend_text">force_backend_text</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_page_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_page_images</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_page_images">generate_page_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_parsed_pages</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_parsed_pages</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_parsed_pages">generate_parsed_pages</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_picture_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_picture_images</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_picture_images">generate_picture_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_table_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_table_images</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_table_images">generate_table_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">images_scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.images_scale</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.images_scale">images_scale</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.kind</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">layout_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_batch_size</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_batch_size">layout_batch_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">layout_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_options</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_options">layout_options</a></code></b>
|
||
(<code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">BaseLayoutOptions</span> (<code>docling.datamodel.pipeline_options.BaseLayoutOptions</code>)" href="#docling.datamodel.pipeline_options.BaseLayoutOptions">BaseLayoutOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ocr_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_batch_size</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_batch_size">ocr_batch_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ocr_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_options</code>)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_options">ocr_options</a></code></b>
|
||
(<code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">OcrOptions</span> (<code>docling.datamodel.pipeline_options.OcrOptions</code>)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;picture_description_options&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.picture_description_options&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.picture_description_options">picture_description_options</a></code></b>
|
||
(<code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PictureDescriptionBaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionBaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;queue_max_size&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.queue_max_size&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.queue_max_size">queue_max_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;table_batch_size&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_batch_size&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_batch_size">table_batch_size</a></code></b>
|
||
(<code><span title="int">int</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;table_structure_options&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-class-attribute&quot;&gt;&lt;code&gt;class-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-instance-attribute&quot;&gt;&lt;code&gt;instance-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_structure_options&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_structure_options">table_structure_options</a></code></b>
|
||
(<code><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseTableStructureOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseTableStructureOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseTableStructureOptions">BaseTableStructureOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.accelerator_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">accelerator_options</span><span class="p">:</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.allow_external_plugins" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">allow_external_plugins</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.artifacts_path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">artifacts_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="pathlib.Path">Path</span></span><span class="p">,</span> <span class="n"><span title="str">str</span></span><span class="p">]]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.batch_polling_interval_seconds" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">batch_polling_interval_seconds</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">batch_polling_interval_seconds</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">0.5</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_code_enrichment" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_code_enrichment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_code_enrichment</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_formula_enrichment" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_formula_enrichment</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_formula_enrichment</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_ocr" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_ocr</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_ocr</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">True</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_classification" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_classification</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_classification</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_picture_description" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_description</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.do_table_structure" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_table_structure</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_table_structure</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">True</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.document_timeout" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">document_timeout</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="float">float</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.enable_remote_services" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">enable_remote_services</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.force_backend_text" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_backend_text</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">force_backend_text</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_page_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_page_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_page_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_parsed_pages" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_parsed_pages</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_parsed_pages</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_picture_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_picture_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_picture_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.generate_table_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_table_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_table_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="n"><span title="pydantic.Field">Field</span></span><span class="p">(</span><span class="n"><span title="pydantic.Field(default)">default</span></span><span class="o">=</span><span class="kc">False</span><span class="p">,</span> <span class="n"><span title="pydantic.Field(deprecated)">deprecated</span></span><span class="o">=</span><span class="s1">'Field `generate_table_images` is deprecated. To obtain table images, set `PdfPipelineOptions.generate_page_images = True` before conversion and then use the `TableItem.get_image` function.'</span><span class="p">)</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.images_scale" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">images_scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">images_scale</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">1.0</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_batch_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">layout_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">layout_batch_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">4</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.layout_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">layout_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">layout_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;BaseLayoutOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.BaseLayoutOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.BaseLayoutOptions">BaseLayoutOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;LayoutOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.LayoutOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.LayoutOptions">LayoutOptions</a></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_batch_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ocr_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">ocr_batch_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">4</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.ocr_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">ocr_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">ocr_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrOptions">OcrOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;OcrAutoOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.OcrAutoOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.OcrAutoOptions">OcrAutoOptions</a></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.picture_description_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_description_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">picture_description_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PictureDescriptionBaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionBaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;smolvlm_picture_description&lt;/span&gt;
|
||
|
||
|
||
&lt;span class=&quot;doc doc-labels&quot;&gt;
|
||
&lt;small class=&quot;doc doc-label doc-label-module-attribute&quot;&gt;&lt;code&gt;module-attribute&lt;/code&gt;&lt;/small&gt;
|
||
&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.smolvlm_picture_description&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.smolvlm_picture_description">smolvlm_picture_description</a></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.queue_max_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">queue_max_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">queue_max_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">100</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_batch_size" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">table_batch_size</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">table_batch_size</span><span class="p">:</span> <span class="n"><span title="int">int</span></span> <span class="o">=</span> <span class="mi">4</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.ThreadedPdfPipelineOptions.table_structure_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">table_structure_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">table_structure_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">BaseTableStructureOptions</span> (<code>docling.datamodel.pipeline_options.BaseTableStructureOptions</code>)" href="#docling.datamodel.pipeline_options.BaseTableStructureOptions">BaseTableStructureOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">TableStructureOptions</span> (<code>docling.datamodel.pipeline_options.TableStructureOptions</code>)" href="#docling.datamodel.pipeline_options.TableStructureOptions">TableStructureOptions</a></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.VlmExtractionPipelineOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">VlmExtractionPipelineOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PipelineOptions</span> (<code>docling.datamodel.pipeline_options.PipelineOptions</code>)" href="#docling.datamodel.pipeline_options.PipelineOptions">PipelineOptions</a></code></p>
|
||
|
||
|
||
|
||
<p>Options for extraction pipeline.</p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.accelerator_options</code>)" href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.accelerator_options">accelerator_options</a></code></b>
|
||
(<code><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.allow_external_plugins</code>)" href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.allow_external_plugins">allow_external_plugins</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.artifacts_path</code>)" href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.artifacts_path">artifacts_path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="typing.Union">Union</span>[<span title="pathlib.Path">Path</span>, <span title="str">str</span>]]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.document_timeout</code>)" href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.document_timeout">document_timeout</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="float">float</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.enable_remote_services</code>)" href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.enable_remote_services">enable_remote_services</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.kind</code>)" href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">vlm_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.vlm_options</code>)" href="#docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.vlm_options">vlm_options</a></code></b>
|
||
(<code><span title="typing.Union">Union</span>[<span title="docling.datamodel.pipeline_options_vlm_model.InlineVlmOptions">InlineVlmOptions</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.accelerator_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">accelerator_options</span><span class="p">:</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.allow_external_plugins" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">allow_external_plugins</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.artifacts_path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">artifacts_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="pathlib.Path">Path</span></span><span class="p">,</span> <span class="n"><span title="str">str</span></span><span class="p">]]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.document_timeout" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">document_timeout</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="float">float</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.enable_remote_services" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">enable_remote_services</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmExtractionPipelineOptions.vlm_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">vlm_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">vlm_options</span><span class="p">:</span> <span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="docling.datamodel.pipeline_options_vlm_model.InlineVlmOptions">InlineVlmOptions</span></span><span class="p">]</span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.vlm_model_specs.NU_EXTRACT_2B_TRANSFORMERS">NU_EXTRACT_2B_TRANSFORMERS</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-class">
|
||
|
||
|
||
|
||
<h3 id="docling.datamodel.pipeline_options.VlmPipelineOptions" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">VlmPipelineOptions</span>
|
||
|
||
|
||
</h3>
|
||
|
||
|
||
<div class="doc doc-contents ">
|
||
<p class="doc doc-class-bases">
|
||
Bases: <code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PaginatedPipelineOptions</span> (<code>docling.datamodel.pipeline_options.PaginatedPipelineOptions</code>)" href="#docling.datamodel.pipeline_options.PaginatedPipelineOptions">PaginatedPipelineOptions</a></code></p>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<p><span class="doc-section-title">Attributes:</span></p>
|
||
<ul>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.accelerator_options</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.accelerator_options">accelerator_options</a></code></b>
|
||
(<code><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.allow_external_plugins</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.allow_external_plugins">allow_external_plugins</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.artifacts_path</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.artifacts_path">artifacts_path</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="typing.Union">Union</span>[<span title="pathlib.Path">Path</span>, <span title="str">str</span>]]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_classification</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_classification</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_classification">do_picture_classification</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_description</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_description">do_picture_description</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.document_timeout</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.document_timeout">document_timeout</a></code></b>
|
||
(<code><span title="typing.Optional">Optional</span>[<span title="float">float</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.enable_remote_services</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.enable_remote_services">enable_remote_services</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_backend_text</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.force_backend_text</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.force_backend_text">force_backend_text</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_page_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.generate_page_images</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.generate_page_images">generate_page_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_picture_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.generate_picture_images</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.generate_picture_images">generate_picture_images</a></code></b>
|
||
(<code><span title="bool">bool</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">images_scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.images_scale</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.images_scale">images_scale</a></code></b>
|
||
(<code><span title="float">float</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.kind</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.kind">kind</a></code></b>
|
||
(<code><span title="str">str</span></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_description_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.picture_description_options</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.picture_description_options">picture_description_options</a></code></b>
|
||
(<code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-class"></code> <span class="doc doc-object-name doc-class-name">PictureDescriptionBaseOptions</span> (<code>docling.datamodel.pipeline_options.PictureDescriptionBaseOptions</code>)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
<li class="doc-section-item field-body">
|
||
<b><code><a class="autorefs autorefs-internal" title="<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">vlm_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span> (<code>docling.datamodel.pipeline_options.VlmPipelineOptions.vlm_options</code>)" href="#docling.datamodel.pipeline_options.VlmPipelineOptions.vlm_options">vlm_options</a></code></b>
|
||
(<code><span title="typing.Union">Union</span>[<span title="docling.datamodel.pipeline_options_vlm_model.InlineVlmOptions">InlineVlmOptions</span>, <span title="docling.datamodel.pipeline_options_vlm_model.ApiVlmOptions">ApiVlmOptions</span>]</code>)
|
||
–
|
||
<div class="doc-md-description">
|
||
|
||
</div>
|
||
</li>
|
||
</ul>
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-children">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.accelerator_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">accelerator_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">accelerator_options</span><span class="p">:</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.accelerator_options.AcceleratorOptions">AcceleratorOptions</span></span><span class="p">()</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.allow_external_plugins" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">allow_external_plugins</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">allow_external_plugins</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.artifacts_path" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">artifacts_path</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">artifacts_path</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="pathlib.Path">Path</span></span><span class="p">,</span> <span class="n"><span title="str">str</span></span><span class="p">]]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_classification" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_classification</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_classification</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.do_picture_description" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">do_picture_description</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">do_picture_description</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.document_timeout" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">document_timeout</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">document_timeout</span><span class="p">:</span> <span class="n"><span title="typing.Optional">Optional</span></span><span class="p">[</span><span class="n"><span title="float">float</span></span><span class="p">]</span> <span class="o">=</span> <span class="kc">None</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.enable_remote_services" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">enable_remote_services</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">enable_remote_services</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.force_backend_text" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">force_backend_text</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">force_backend_text</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.generate_page_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_page_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_page_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">True</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.generate_picture_images" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">generate_picture_images</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">generate_picture_images</span><span class="p">:</span> <span class="n"><span title="bool">bool</span></span> <span class="o">=</span> <span class="kc">False</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.images_scale" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">images_scale</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">images_scale</span><span class="p">:</span> <span class="n"><span title="float">float</span></span> <span class="o">=</span> <span class="mf">1.0</span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.kind" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">kind</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">kind</span><span class="p">:</span> <span class="n"><span title="str">str</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.picture_description_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">picture_description_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">picture_description_options</span><span class="p">:</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-class&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-class-name&quot;&gt;PictureDescriptionBaseOptions&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.PictureDescriptionBaseOptions&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.PictureDescriptionBaseOptions">PictureDescriptionBaseOptions</a></span> <span class="o">=</span> <span class="n"><a class="autorefs autorefs-internal" title="&lt;code class=&quot;doc-symbol doc-symbol-heading doc-symbol-attribute&quot;&gt;&lt;/code&gt; &lt;span class=&quot;doc doc-object-name doc-attribute-name&quot;&gt;smolvlm_picture_description&lt;/span&gt; &lt;span class=&quot;doc doc-labels&quot;&gt;&lt;small class=&quot;doc doc-label doc-label-module-attribute&quot;&gt;&lt;code&gt;module-attribute&lt;/code&gt;&lt;/small&gt;&lt;/span&gt; (&lt;code&gt;docling.datamodel.pipeline_options.smolvlm_picture_description&lt;/code&gt;)" href="#docling.datamodel.pipeline_options.smolvlm_picture_description">smolvlm_picture_description</a></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
<div class="doc doc-object doc-attribute">
|
||
|
||
|
||
|
||
<h4 id="docling.datamodel.pipeline_options.VlmPipelineOptions.vlm_options" class="doc doc-heading">
|
||
<code class="doc-symbol doc-symbol-heading doc-symbol-attribute"></code> <span class="doc doc-object-name doc-attribute-name">vlm_options</span>
|
||
|
||
|
||
<span class="doc doc-labels">
|
||
<small class="doc doc-label doc-label-class-attribute"><code>class-attribute</code></small>
|
||
<small class="doc doc-label doc-label-instance-attribute"><code>instance-attribute</code></small>
|
||
</span>
|
||
|
||
</h4>
|
||
<div class="doc-signature highlight"><pre><span></span><code><span class="n">vlm_options</span><span class="p">:</span> <span class="n"><span title="typing.Union">Union</span></span><span class="p">[</span><span class="n"><span title="docling.datamodel.pipeline_options_vlm_model.InlineVlmOptions">InlineVlmOptions</span></span><span class="p">,</span> <span class="n"><span title="docling.datamodel.pipeline_options_vlm_model.ApiVlmOptions">ApiVlmOptions</span></span><span class="p">]</span> <span class="o">=</span> <span class="n"><span title="docling.datamodel.vlm_model_specs.GRANITEDOCLING_TRANSFORMERS">GRANITEDOCLING_TRANSFORMERS</span></span>
|
||
</code></pre></div>
|
||
|
||
<div class="doc doc-contents ">
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
|
||
|
||
|
||
</div>
|
||
|
||
</div>
|
||
|
||
</div><!-- ::: docling.document_converter.DocumentConverter
|
||
handler: python
|
||
options:
|
||
show_if_no_docstring: true
|
||
show_submodules: true -->
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</article>
|
||
</div>
|
||
|
||
|
||
<script>
  // Re-select previously chosen content tabs.
  // Reads the "__tabs" entry through __md_get (defined in the page head) and,
  // when it is an array, walks every ".tabbed-set" on the page. For each set
  // the stored entries are tried in order; the first label whose trimmed text
  // equals an entry gets its associated input checked, then the next set is
  // processed.
  var tabs = __md_get("__tabs");
  if (Array.isArray(tabs)) {
    nextSet: for (var set of document.querySelectorAll(".tabbed-set")) {
      var labels = set.querySelector(".tabbed-labels");
      // A set without a ".tabbed-labels" container has nothing to match;
      // skip it instead of throwing and aborting the remaining sets.
      if (!labels) continue;
      for (var tab of tabs) {
        for (var label of labels.getElementsByTagName("label")) {
          if (label.innerText.trim() === tab) {
            var input = document.getElementById(label.htmlFor);
            // Only act when the label actually points at an existing element.
            if (input) {
              input.checked = true;
              continue nextSet;
            }
          }
        }
      }
    }
  }
</script>
|
||
|
||
<script>
  // Look up the element whose id equals the URL fragment (without the "#").
  // When that element exists and has a non-empty `name`, its `checked`
  // property is set to whether the name starts with "__tabbed_".
  var target = document.getElementById(location.hash.slice(1));
  if (target && target.name) {
    target.checked = target.name.startsWith("__tabbed_");
  }
</script>
|
||
</div>
|
||
|
||
<button type="button" class="md-top md-icon" data-md-component="top" hidden>
|
||
|
||
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M13 20h-2V8l-5.5 5.5-1.42-1.42L12 4.16l7.92 7.92-1.42 1.42L13 8z"/></svg>
|
||
Back to top
|
||
</button>
|
||
|
||
</main>
|
||
|
||
<footer class="md-footer">
|
||
|
||
|
||
|
||
<nav class="md-footer__inner md-grid" aria-label="Footer" >
|
||
|
||
|
||
<a href="../document_converter/" class="md-footer__link md-footer__link--prev" aria-label="Previous: Document Converter">
|
||
<div class="md-footer__button md-icon">
|
||
|
||
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M20 11v2H8l5.5 5.5-1.42 1.42L4.16 12l7.92-7.92L13.5 5.5 8 11z"/></svg>
|
||
</div>
|
||
<div class="md-footer__title">
|
||
<span class="md-footer__direction">
|
||
Previous
|
||
</span>
|
||
<div class="md-ellipsis">
|
||
Document Converter
|
||
</div>
|
||
</div>
|
||
</a>
|
||
|
||
|
||
|
||
<a href="../docling_document/" class="md-footer__link md-footer__link--next" aria-label="Next: Docling Document">
|
||
<div class="md-footer__title">
|
||
<span class="md-footer__direction">
|
||
Next
|
||
</span>
|
||
<div class="md-ellipsis">
|
||
Docling Document
|
||
</div>
|
||
</div>
|
||
<div class="md-footer__button md-icon">
|
||
|
||
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 24 24"><path d="M4 11v2h12l-5.5 5.5 1.42 1.42L19.84 12l-7.92-7.92L10.5 5.5 16 11z"/></svg>
|
||
</div>
|
||
</a>
|
||
|
||
</nav>
|
||
|
||
|
||
<div class="md-footer-meta md-typeset">
|
||
<div class="md-footer-meta__inner md-grid">
|
||
<div class="md-copyright">
|
||
|
||
|
||
Made with
|
||
<a href="https://squidfunk.github.io/mkdocs-material/" target="_blank" rel="noopener">
|
||
Material for MkDocs
|
||
</a>
|
||
|
||
</div>
|
||
|
||
|
||
<div class="md-social">
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<a href="https://github.com/docling-project/docling" target="_blank" rel="noopener" title="github.com" class="md-social__link">
|
||
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512"><!--! Font Awesome Free 7.1.0 by @fontawesome - https://fontawesome.com License - https://fontawesome.com/license/free (Icons: CC BY 4.0, Fonts: SIL OFL 1.1, Code: MIT License) Copyright 2025 Fonticons, Inc.--><path d="M173.9 397.4c0 2-2.3 3.6-5.2 3.6-3.3.3-5.6-1.3-5.6-3.6 0-2 2.3-3.6 5.2-3.6 3-.3 5.6 1.3 5.6 3.6m-31.1-4.5c-.7 2 1.3 4.3 4.3 4.9 2.6 1 5.6 0 6.2-2s-1.3-4.3-4.3-5.2c-2.6-.7-5.5.3-6.2 2.3m44.2-1.7c-2.9.7-4.9 2.6-4.6 4.9.3 2 2.9 3.3 5.9 2.6 2.9-.7 4.9-2.6 4.6-4.6-.3-1.9-3-3.2-5.9-2.9M252.8 8C114.1 8 8 113.3 8 252c0 110.9 69.8 205.8 169.5 239.2 12.8 2.3 17.3-5.6 17.3-12.1 0-6.2-.3-40.4-.3-61.4 0 0-70 15-84.7-29.8 0 0-11.4-29.1-27.8-36.6 0 0-22.9-15.7 1.6-15.4 0 0 24.9 2 38.6 25.8 21.9 38.6 58.6 27.5 72.9 20.9 2.3-16 8.8-27.1 16-33.7-55.9-6.2-112.3-14.3-112.3-110.5 0-27.5 7.6-41.3 23.6-58.9-2.6-6.5-11.1-33.3 2.6-67.9 20.9-6.5 69 27 69 27 20-5.6 41.5-8.5 62.8-8.5s42.8 2.9 62.8 8.5c0 0 48.1-33.6 69-27 13.7 34.7 5.2 61.4 2.6 67.9 16 17.7 25.8 31.5 25.8 58.9 0 96.5-58.9 104.2-114.8 110.5 9.2 7.9 17 22.9 17 46.4 0 33.7-.3 75.4-.3 83.6 0 6.5 4.6 14.4 17.3 12.1C436.2 457.8 504 362.9 504 252 504 113.3 391.5 8 252.8 8M105.2 352.9c-1.3 1-1 3.3.7 5.2 1.6 1.6 3.9 2.3 5.2 1 1.3-1 1-3.3-.7-5.2-1.6-1.6-3.9-2.3-5.2-1m-10.8-8.1c-.7 1.3.3 2.9 2.3 3.9 1.6 1 3.6.7 4.3-.7.7-1.3-.3-2.9-2.3-3.9-2-.6-3.6-.3-4.3.7m32.4 35.6c-1.6 1.3-1 4.3 1.3 6.2 2.3 2.3 5.2 2.6 6.5 1 1.3-1.3.7-4.3-1.3-6.2-2.2-2.3-5.2-2.6-6.5-1m-11.4-14.7c-1.6 1-1.6 3.6 0 5.9s4.3 3.3 5.6 2.3c1.6-1.3 1.6-3.9 0-6.2-1.4-2.3-4-3.3-5.6-2"/></svg>
|
||
</a>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<a href="https://docling.ai/discord" target="_blank" rel="noopener" title="docling.ai" class="md-social__link">
|
||
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 576 512"><!--! Font Awesome Free 7.1.0 by @fontawesome - https://fontawesome.com License - https://fontawesome.com/license/free (Icons: CC BY 4.0, Fonts: SIL OFL 1.1, Code: MIT License) Copyright 2025 Fonticons, Inc.--><path d="M492.5 69.8c-.2-.3-.4-.6-.8-.7-38.1-17.5-78.4-30-119.7-37.1-.4-.1-.8 0-1.1.1s-.6.4-.8.8c-5.5 9.9-10.5 20.2-14.9 30.6-44.6-6.8-89.9-6.8-134.4 0-4.5-10.5-9.5-20.7-15.1-30.6-.2-.3-.5-.6-.8-.8s-.7-.2-1.1-.2C162.5 39 122.2 51.5 84.1 69c-.3.1-.6.4-.8.7C7.1 183.5-13.8 294.6-3.6 404.2c0 .3.1.5.2.8s.3.4.5.6c44.4 32.9 94 58 146.8 74.2.4.1.8.1 1.1 0s.7-.4.9-.7c11.3-15.4 21.4-31.8 30-48.8.1-.2.2-.5.2-.8s0-.5-.1-.8-.2-.5-.4-.6-.4-.3-.7-.4c-15.8-6.1-31.2-13.4-45.9-21.9-.3-.2-.5-.4-.7-.6s-.3-.6-.3-.9 0-.6.2-.9.3-.5.6-.7c3.1-2.3 6.2-4.7 9.1-7.1.3-.2.6-.4.9-.4s.7 0 1 .1c96.2 43.9 200.4 43.9 295.5 0 .3-.1.7-.2 1-.2s.7.2.9.4c2.9 2.4 6 4.9 9.1 7.2.2.2.4.4.6.7s.2.6.2.9-.1.6-.3.9-.4.5-.6.6c-14.7 8.6-30 15.9-45.9 21.8-.2.1-.5.2-.7.4s-.3.4-.4.7-.1.5-.1.8.1.5.2.8c8.8 17 18.8 33.3 30 48.8.2.3.6.6.9.7s.8.1 1.1 0c52.9-16.2 102.6-41.3 147.1-74.2.2-.2.4-.4.5-.6s.2-.5.2-.8c12.3-126.8-20.5-236.9-86.9-334.5zm-302 267.7c-29 0-52.8-26.6-52.8-59.2s23.4-59.2 52.8-59.2c29.7 0 53.3 26.8 52.8 59.2 0 32.7-23.4 59.2-52.8 59.2m195.4 0c-29 0-52.8-26.6-52.8-59.2s23.4-59.2 52.8-59.2c29.7 0 53.3 26.8 52.8 59.2 0 32.7-23.2 59.2-52.8 59.2"/></svg>
|
||
</a>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<a href="https://linkedin.com/company/docling/" target="_blank" rel="noopener" title="linkedin.com" class="md-social__link">
|
||
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 448 512"><!--! Font Awesome Free 7.1.0 by @fontawesome - https://fontawesome.com License - https://fontawesome.com/license/free (Icons: CC BY 4.0, Fonts: SIL OFL 1.1, Code: MIT License) Copyright 2025 Fonticons, Inc.--><path d="M416 32H31.9C14.3 32 0 46.5 0 64.3v383.4C0 465.5 14.3 480 31.9 480H416c17.6 0 32-14.5 32-32.3V64.3c0-17.8-14.4-32.3-32-32.3M135.4 416H69V202.2h66.5V416zM102.2 96a38.5 38.5 0 1 1 0 77 38.5 38.5 0 1 1 0-77m282.1 320h-66.4V312c0-24.8-.5-56.7-34.5-56.7-34.6 0-39.9 27-39.9 54.9V416h-66.4V202.2h63.7v29.2h.9c8.9-16.8 30.6-34.5 62.9-34.5 67.2 0 79.7 44.3 79.7 101.9z"/></svg>
|
||
</a>
|
||
|
||
</div>
|
||
|
||
</div>
|
||
</div>
|
||
</footer>
|
||
|
||
</div>
|
||
<div class="md-dialog" data-md-component="dialog">
|
||
<div class="md-dialog__inner md-typeset"></div>
|
||
</div>
|
||
|
||
<div class="md-progress" data-md-component="progress" role="progressbar" aria-label="Page loading progress"></div>
|
||
|
||
|
||
|
||
|
||
|
||
<script id="__config" type="application/json">{"annotate": null, "base": "../..", "features": ["content.tabs.link", "content.code.annotate", "content.code.copy", "content.tooltips", "announce.dismiss", "navigation.footer", "navigation.tabs", "navigation.indexes", "navigation.instant", "navigation.instant.prefetch", "navigation.instant.progress", "navigation.path", "navigation.top", "navigation.tracking", "search.suggest", "toc.follow"], "search": "../../assets/javascripts/workers/search.7a47a382.min.js", "tags": null, "translations": {"clipboard.copied": "Copied to clipboard", "clipboard.copy": "Copy to clipboard", "search.result.more.one": "1 more on this page", "search.result.more.other": "# more on this page", "search.result.none": "No matching documents", "search.result.one": "1 matching document", "search.result.other": "# matching documents", "search.result.placeholder": "Type to start searching", "search.result.term.missing": "Missing", "select.version": "Select version"}, "version": null}</script>
|
||
|
||
|
||
<script src="../../assets/javascripts/bundle.e71a0d61.min.js"></script>
|
||
|
||
|
||
</body>
|
||
</html> |