diff --git a/docling/experimental/pipeline/threaded_layout_vlm_pipeline.py b/docling/experimental/pipeline/threaded_layout_vlm_pipeline.py index 92c0c104..db73db8d 100644 --- a/docling/experimental/pipeline/threaded_layout_vlm_pipeline.py +++ b/docling/experimental/pipeline/threaded_layout_vlm_pipeline.py @@ -232,9 +232,12 @@ class ThreadedLayoutVlmPipeline(BasePipeline): # Initialize pages start_page, end_page = conv_res.input.limits.page_range pages: List[Page] = [] + images_scale = self.pipeline_options.images_scale for i in range(conv_res.input.page_count): if start_page - 1 <= i <= end_page - 1: page = Page(page_no=i) + if images_scale is not None: + page._default_image_scale = images_scale page._backend = backend.load_page(i) if page._backend and page._backend.is_valid(): page.size = page._backend.get_size() diff --git a/docling/pipeline/vlm_pipeline.py b/docling/pipeline/vlm_pipeline.py index 6fabdb38..ab919c4d 100644 --- a/docling/pipeline/vlm_pipeline.py +++ b/docling/pipeline/vlm_pipeline.py @@ -114,6 +114,9 @@ class VlmPipeline(PaginatedPipeline): def initialize_page(self, conv_res: ConversionResult, page: Page) -> Page: with TimeRecorder(conv_res, "page_init"): + images_scale = self.pipeline_options.images_scale + if images_scale is not None: + page._default_image_scale = images_scale page._backend = conv_res.input._backend.load_page(page.page_no) # type: ignore if page._backend is not None and page._backend.is_valid(): page.size = page._backend.get_size() diff --git a/docs/examples/demo_layout_vlm.py b/docs/examples/demo_layout_vlm.py index 18eb4aa1..13a5295f 100644 --- a/docs/examples/demo_layout_vlm.py +++ b/docs/examples/demo_layout_vlm.py @@ -113,7 +113,7 @@ def demo_threaded_layout_vlm_pipeline( # Queue configuration queue_max_size=10, # Image processing - images_scale=2.0, + images_scale=vlm_options.scale, generate_page_images=True, enable_remote_services=use_api_vlm, ) @@ -142,7 +142,7 @@ def demo_threaded_layout_vlm_pipeline( ) result_layout_aware.document.save_as_html( - out_dir_layout_aware / f"{doc_filename}.html" + out_dir_layout_aware / f"{doc_filename}.html", split_page_view=True ) for page in result_layout_aware.pages: _log.info("Page %s of VLM response:", page.page_no)