docling/tests/data/groundtruth/docling_v1/2305.03393v1-pg9.json
Christoph Auer e00f362405
Some checks failed
Run Docs CI / build-docs (push) Failing after 1m26s
Run CI / code-checks (push) Failing after 6m37s
Update tests, use TextCell.from_ocr property
Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
2025-03-13 16:04:08 +01:00

1 line
3.0 KiB
JSON

{"_name": "", "type": "pdf-document", "description": {"title": null, "abstract": null, "authors": null, "affiliations": null, "subjects": null, "keywords": null, "publication_date": null, "languages": null, "license": null, "publishers": null, "url_refs": null, "references": null, "publication": null, "reference_count": null, "citation_count": null, "citation_date": null, "advanced": null, "analytics": null, "logs": [], "collection": null, "acquisition": null}, "file-info": {"filename": "2305.03393v1-pg9.pdf", "filename-prov": null, "document-hash": "1a36870a3e6aa062b563b50c1eaed40685b651ee03e0538453de65e7013b742f", "#-pages": 1, "collection-name": null, "description": null, "page-hashes": [{"hash": "8a5a8d9a1ae6cbd1dcedcad02ed10195aa71d1ac3e4d56be4ab72c858d7f543e", "model": "default", "page": 1}]}, "main-text": [{"prov": [{"bbox": [134.765, 663.83, 480.591, 673.126], "page": 1, "span": [0, 76], "__ref_s3_data": null}], "text": "order to compute the TED score. Inference timing results for all experiments", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"prov": [{"bbox": [134.765, 613.617, 149.403, 622.844], "page": 1, "span": [0, 3], "__ref_s3_data": null}], "text": "5.1", "type": "subtitle-level-1", "payload": null, "name": "Section-header", "font": null}, {"prov": [{"bbox": [134.765, 597.178, 480.582, 606.474], "page": 1, "span": [0, 73], "__ref_s3_data": null}], "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"name": "Table", "type": "table", "$ref": "#/tables/0"}, {"prov": [{"bbox": [134.765, 508.127, 160.118, 518.264], "page": 1, "span": [0, 5], "__ref_s3_data": null}], "text": "Table", "type": "caption", "payload": null, "name": "Caption", "font": null}, {"prov": [{"bbox": [134.765, 274.65100000000007, 149.403, 283.878], "page": 1, "span": [0, 3], "__ref_s3_data": null}], "text": "5.2", "type": "subtitle-level-1", "payload": null, "name": "Section-header", "font": null}, {"prov": [{"bbox": [134.765, 258.21299999999997, 480.562, 267.509], "page": 1, "span": [0, 77], "__ref_s3_data": null}], "text": "We picked the model parameter configuration that produced the best prediction", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"prov": [{"bbox": [149.709, 162.57100000000003, 205.6, 171.86699999999996], "page": 1, "span": [0, 13], "__ref_s3_data": null}], "text": "Additionally,", "type": "paragraph", "payload": null, "name": "Text", "font": null}], "figures": [], "tables": [{"prov": [{"bbox": [139.66741943359375, 322.5054626464844, 475.00927734375, 454.45458984375], "page": 1, "span": [0, 0], "__ref_s3_data": null}], "text": "Table", "type": "table", "payload": null, "#-cols": 0, "#-rows": 0, "data": [], "model": null, "bounding-box": null}], "bitmaps": null, "equations": [], "footnotes": [], "page-dimensions": [{"height": 792.0, "page": 1, "width": 612.0}], "page-footers": [], "page-headers": [], "_s3_data": null, "identifiers": null}