mirror of
https://github.com/DS4SD/docling.git
synced 2025-07-28 21:14:23 +00:00
* Update tests for docling-core 2.5.0 Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Add export with referenced images to export_figures example Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Fix OCR tests Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Revert "Fix OCR tests" This reverts commit 12b575946f51950fcacece99d4d6eb682125d779. Signed-off-by: Christoph Auer <cau@zurich.ibm.com> * Update lockfile for docling-core 2.5.1 Signed-off-by: Christoph Auer <cau@zurich.ibm.com> --------- Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
1 line
1.1 KiB
JSON
1 line
1.1 KiB
JSON
{"schema_name": "DoclingDocument", "version": "1.0.0", "name": "ocr_test", "origin": {"mimetype": "application/pdf", "binary_hash": 14853448746796404529, "filename": "ocr_test.pdf", "uri": null}, "furniture": {"self_ref": "#/furniture", "parent": null, "children": [], "name": "_root_", "label": "unspecified"}, "body": {"self_ref": "#/body", "parent": null, "children": [{"cref": "#/texts/0"}], "name": "_root_", "label": "unspecified"}, "groups": [], "texts": [{"self_ref": "#/texts/0", "parent": {"cref": "#/body"}, "children": [], "label": "text", "prov": [{"page_no": 1, "bbox": {"l": 70.90211486816406, "t": 765.0995483398438, "r": 504.87200927734375, "b": 689.2166748046875, "coord_origin": "BOTTOMLEFT"}, "charspan": [0, 94]}], "orig": "Docling bundles PDF document conversion to JSON and Markdown in an easy self contained package", "text": "Docling bundles PDF document conversion to JSON and Markdown in an easy self contained package"}], "pictures": [], "tables": [], "key_value_items": [], "pages": {"1": {"size": {"width": 595.201171875, "height": 841.9216918945312}, "image": null, "page_no": 1}}} |