From e13fa5ade8f0c2203dd1714685c651b29ef4e07f Mon Sep 17 00:00:00 2001
From: Maksym Lysak
Date: Wed, 19 Mar 2025 14:40:21 +0100
Subject: [PATCH] Updated example

Signed-off-by: Maksym Lysak
---
Review notes (text between the "---" separator and the diff is ignored by
`git am`):

* What the patch does: removes the "MD:" banner prints, removes the manual
  accumulation of per-page DOCTAGS text and the ".doctag" file it was
  written to, and replaces the hand-written Markdown file write with
  res.document.save_as_markdown(); it also adds a
  res.document.save_as_json() call. Both new calls pass
  image_mode=ImageRefMode.PLACEHOLDER.
* Fix applied in review: the added save_as_json() call now targets
  "<stem>.json". As originally posted it targeted "<stem>.md", the very
  path that save_as_markdown() writes to immediately afterwards, so the
  JSON output would have been replaced by the Markdown output.
* The pre-existing json.dumps() write to "<stem>.json" (context lines of
  the second hunk) is left untouched; with the fix above it writes the same
  path and looks redundant -- TODO confirm and drop it in a follow-up.
* The blob ids on the "index" line still describe the originally posted
  post-image; hunk line counts and the diffstat are unaffected by the fix.
* ImageRefMode must already be imported by the example; the import is not
  visible in these hunks -- TODO confirm.

 docs/examples/minimal_vlm_pipeline.py | 18 ++++++++----------
 1 file changed, 8 insertions(+), 10 deletions(-)

diff --git a/docs/examples/minimal_vlm_pipeline.py b/docs/examples/minimal_vlm_pipeline.py
index 023cbc30..6a15fe42 100644
--- a/docs/examples/minimal_vlm_pipeline.py
+++ b/docs/examples/minimal_vlm_pipeline.py
@@ -68,18 +68,13 @@ for source in sources:
 
     res = converter.convert(source)
 
-    print("------------------------------------------------")
-    print("MD:")
-    print("------------------------------------------------")
     print("")
     print(res.document.export_to_markdown())
 
-    doctags = ""
     for page in res.pages:
         print("")
         print("Predicted page in DOCTAGS:")
         print(page.predictions.vlm_response.text)
-        doctags += page.predictions.vlm_response.text
 
     res.document.save_as_html(
         filename=Path("{}/{}.html".format(out_path, res.input.file.stem)),
@@ -90,14 +85,17 @@ for source in sources:
     with (out_path / f"{res.input.file.stem}.json").open("w") as fp:
         fp.write(json.dumps(res.document.export_to_dict()))
 
-    with (out_path / f"{res.input.file.stem}.md").open("w") as fp:
-        fp.write(res.document.export_to_markdown())
+    res.document.save_as_json(
+        out_path / f"{res.input.file.stem}.json",
+        image_mode=ImageRefMode.PLACEHOLDER,
+    )
 
-    with (out_path / f"{res.input.file.stem}.doctag").open("w") as fp:
-        fp.write(doctags)
+    res.document.save_as_markdown(
+        out_path / f"{res.input.file.stem}.md",
+        image_mode=ImageRefMode.PLACEHOLDER,
+    )
 
     pg_num = res.document.num_pages()
-
     print("")
     inference_time = time.time() - start_time
     print(