docling/tests/data/groundtruth/docling_v1/amt_handbook_sample.json
Christoph Auer e00f362405
Some checks failed
Run Docs CI / build-docs (push) Failing after 1m26s
Run CI / code-checks (push) Failing after 6m37s
Update tests, use TextCell.from_ocr property
Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
2025-03-13 16:04:08 +01:00

1 line
4.4 KiB
JSON

{"_name": "", "type": "pdf-document", "description": {"title": null, "abstract": null, "authors": null, "affiliations": null, "subjects": null, "keywords": null, "publication_date": null, "languages": null, "license": null, "publishers": null, "url_refs": null, "references": null, "publication": null, "reference_count": null, "citation_count": null, "citation_date": null, "advanced": null, "analytics": null, "logs": [], "collection": null, "acquisition": null}, "file-info": {"filename": "amt_handbook_sample.pdf", "filename-prov": null, "document-hash": "4ba7cdbd9ce8155d692d8f477f88bb3ec1acc2a463cf1e0209d1e624e58ebce9", "#-pages": 1, "collection-name": null, "description": null, "page-hashes": [{"hash": "f31706a847734c62e1e41f9f792c756283d1d4955552c1cc7f5e23c351bdd7cb", "model": "default", "page": 1}]}, "main-text": [{"prov": [{"bbox": [71.992, 719.501, 309.122, 727.966], "page": 1, "span": [0, 58], "__ref_s3_data": null}], "text": "pulleys, provided the inner race of the bearing is clamped", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"prov": [{"bbox": [71.992, 657.001, 309.033, 665.466], "page": 1, "span": [0, 59], "__ref_s3_data": null}], "text": "The two general types of self-locking nuts currently in use", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"prov": [{"bbox": [71.992, 569.5, 167.272, 577.876], "page": 1, "span": [0, 22], "__ref_s3_data": null}], "text": "Boots Self-Locking Nut", "type": "subtitle-level-1", "payload": null, "name": "Section-header", "font": null}, {"prov": [{"bbox": [174.212, 555.001, 311.548, 563.466], "page": 1, "span": [0, 35], "__ref_s3_data": null}], "text": "nut is of one piece, all-metal", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"prov": [{"bbox": [71.992, 467.501, 309.03, 475.966], "page": 1, "span": [0, 60], "__ref_s3_data": null}], "text": "The spring keeps the locking and load-carrying sections such", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"prov": [{"bbox": [71.992, 380.001, 309.042, 388.466], "page": 1, "span": [0, 61], "__ref_s3_data": null}], "text": "The spring, through the medium of the locking section, exerts", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"prov": [{"bbox": [71.992, 267.501, 311.502, 275.966], "page": 1, "span": [0, 60], "__ref_s3_data": null}], "text": "Boots self-locking nuts are made with three different spring", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"name": "Picture", "type": "figure", "$ref": "#/figures/0"}, {"prov": [{"bbox": [320.992, 719.501, 560.508, 727.966], "page": 1, "span": [0, 61], "__ref_s3_data": null}], "text": "the most common ranges in size for No. 6 up to 1 4 inch, the", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"prov": [{"bbox": [320.995, 632.0, 450.995, 640.376], "page": 1, "span": [0, 32], "__ref_s3_data": null}], "text": "Stainless Steel Self-Locking Nut", "type": "subtitle-level-1", "payload": null, "name": "Section-header", "font": null}, {"prov": [{"bbox": [320.995, 617.501, 560.498, 625.966], "page": 1, "span": [0, 59], "__ref_s3_data": null}], "text": "The stainless steel self-locking nut may be spun on and off", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"prov": [{"bbox": [320.995, 392.5, 388.505, 400.876], "page": 1, "span": [0, 16], "__ref_s3_data": null}], "text": "Elastic Stop Nut", "type": "subtitle-level-1", "payload": null, "name": "Section-header", "font": null}, {"prov": [{"bbox": [320.995, 378.001, 558.104, 386.466], "page": 1, "span": [0, 63], "__ref_s3_data": null}], "text": "The elastic stop nut is a standard nut with the height", "type": "paragraph", "payload": null, "name": "Text", "font": null}, {"name": "Picture", "type": "figure", "$ref": "#/figures/1"}], "figures": [{"prov": [{"bbox": [70.59269714355469, 79.6090087890625, 309.863037109375, 242.77777099609375], "page": 1, "span": [0, 12], "__ref_s3_data": null}], "text": "Figure 7-26.", "type": "figure", "payload": null, "bounding-box": null}, {"prov": [{"bbox": [320.4467468261719, 81.689208984375, 558.8576049804688, 352.359375], "page": 1, "span": [0, 12], "__ref_s3_data": null}], "text": "Figure 7-27.", "type": "figure", "payload": null, "bounding-box": null}], "tables": [], "bitmaps": null, "equations": [], "footnotes": [], "page-dimensions": [{"height": 774.0, "page": 1, "width": 594.0}], "page-footers": [], "page-headers": [], "_s3_data": null, "identifiers": null}