docling/tests/data/groundtruth/docling_v2/2305.03393v1-pg9.json
Christoph Auer 0e63cb09e6 Remove pages.json from diff
Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
2025-06-19 16:19:46 +02:00

2122 lines
62 KiB
JSON
Vendored

{
"schema_name": "DoclingDocument",
"version": "1.3.0",
"name": "2305.03393v1-pg9",
"origin": {
"mimetype": "application/pdf",
"binary_hash": 3463920545297462180,
"filename": "2305.03393v1-pg9.pdf",
"uri": null
},
"furniture": {
"self_ref": "#/furniture",
"parent": null,
"children": [],
"content_layer": "furniture",
"name": "_root_",
"label": "unspecified"
},
"body": {
"self_ref": "#/body",
"parent": null,
"children": [
{
"cref": "#/texts/0"
},
{
"cref": "#/texts/1"
},
{
"cref": "#/texts/2"
},
{
"cref": "#/texts/3"
},
{
"cref": "#/texts/4"
},
{
"cref": "#/tables/0"
},
{
"cref": "#/texts/6"
},
{
"cref": "#/texts/7"
},
{
"cref": "#/texts/8"
}
],
"content_layer": "body",
"name": "_root_",
"label": "unspecified"
},
"groups": [],
"texts": [
{
"self_ref": "#/texts/0",
"parent": {
"cref": "#/body"
},
"children": [],
"content_layer": "furniture",
"label": "page_header",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 194.478,
"t": 698.337,
"r": 447.545,
"b": 689.963,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
60
]
}
],
"orig": "Optimized Table Tokenization for Table Structure Recognition",
"text": "Optimized Table Tokenization for Table Structure Recognition",
"formatting": null,
"hyperlink": null
},
{
"self_ref": "#/texts/1",
"parent": {
"cref": "#/body"
},
"children": [],
"content_layer": "furniture",
"label": "page_header",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 475.984,
"t": 698.337,
"r": 480.593,
"b": 689.963,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
1
]
}
],
"orig": "9",
"text": "9",
"formatting": null,
"hyperlink": null
},
{
"self_ref": "#/texts/2",
"parent": {
"cref": "#/body"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 134.765,
"t": 673.126,
"r": 480.597,
"b": 639.919,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
163
]
}
],
"orig": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz.",
"text": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz.",
"formatting": null,
"hyperlink": null
},
{
"self_ref": "#/texts/3",
"parent": {
"cref": "#/body"
},
"children": [],
"content_layer": "body",
"label": "section_header",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 134.765,
"t": 622.844,
"r": 318.451,
"b": 613.617,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
32
]
}
],
"orig": "5.1 Hyper Parameter Optimization",
"text": "5.1 Hyper Parameter Optimization",
"formatting": null,
"hyperlink": null,
"level": 1
},
{
"self_ref": "#/texts/4",
"parent": {
"cref": "#/body"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 134.765,
"t": 606.474,
"r": 480.596,
"b": 536.933,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
423
]
}
],
"orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML.",
"text": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML.",
"formatting": null,
"hyperlink": null
},
{
"self_ref": "#/texts/5",
"parent": {
"cref": "#/tables/0"
},
"children": [],
"content_layer": "body",
"label": "caption",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 134.765,
"t": 518.264,
"r": 480.599,
"b": 464.763,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
398
]
}
],
"orig": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart.",
"text": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart.",
"formatting": null,
"hyperlink": null
},
{
"self_ref": "#/texts/6",
"parent": {
"cref": "#/body"
},
"children": [],
"content_layer": "body",
"label": "section_header",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 134.765,
"t": 283.878,
"r": 264.408,
"b": 274.65100000000007,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
24
]
}
],
"orig": "5.2 Quantitative Results",
"text": "5.2 Quantitative Results",
"formatting": null,
"hyperlink": null,
"level": 1
},
{
"self_ref": "#/texts/7",
"parent": {
"cref": "#/body"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 134.765,
"t": 267.509,
"r": 480.722,
"b": 174.52600000000007,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
557
]
}
],
"orig": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on di ffi cult financial tables (FinTabNet) that contain sparse and large tables.",
"text": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on di ffi cult financial tables (FinTabNet) that contain sparse and large tables.",
"formatting": null,
"hyperlink": null
},
{
"self_ref": "#/texts/8",
"parent": {
"cref": "#/body"
},
"children": [],
"content_layer": "body",
"label": "text",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 134.765,
"t": 171.86699999999996,
"r": 480.599,
"b": 126.70600000000002,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
289
]
}
],
"orig": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation.",
"text": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation.",
"formatting": null,
"hyperlink": null
}
],
"pictures": [],
"tables": [
{
"self_ref": "#/tables/0",
"parent": {
"cref": "#/body"
},
"children": [
{
"cref": "#/texts/5"
}
],
"content_layer": "body",
"label": "table",
"prov": [
{
"page_no": 1,
"bbox": {
"l": 139.6674041748047,
"t": 454.4546203613281,
"r": 475.00927734375,
"b": 322.5054626464844,
"coord_origin": "BOTTOMLEFT"
},
"charspan": [
0,
0
]
}
],
"captions": [
{
"cref": "#/texts/5"
}
],
"references": [],
"footnotes": [],
"image": null,
"data": {
"table_cells": [
{
"bbox": {
"l": 160.37,
"t": 341.627,
"r": 168.045,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 2,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "# enc-layers",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.974,
"t": 341.627,
"r": 215.649,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 2,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "# dec-layers",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 239.798,
"t": 347.106,
"r": 278.333,
"b": 355.48,
"coord_origin": "TOPLEFT"
},
"row_span": 2,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Language",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 324.67,
"t": 341.627,
"r": 348.263,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 3,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 6,
"text": "TEDs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 396.271,
"t": 341.627,
"r": 417.123,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "mAP",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.927,
"t": 352.586,
"r": 418.473,
"b": 360.96,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "(0.75)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 430.771,
"t": 341.627,
"r": 467.141,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "Inference",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.148,
"t": 352.586,
"r": 445.07,
"b": 360.96,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "time (secs)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 286.686,
"t": 354.578,
"r": 312.325,
"b": 362.952,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 320.702,
"t": 354.578,
"r": 353.718,
"b": 362.952,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 369.306,
"t": 354.578,
"r": 379.031,
"b": 362.952,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "all",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 161.906,
"t": 373.408,
"r": 166.515,
"b": 381.782,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.509,
"t": 373.408,
"r": 214.118,
"b": 381.782,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 246.71,
"t": 367.928,
"r": 271.409,
"b": 376.302,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "OTSL HTML",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 289.017,
"t": 367.928,
"r": 310.009,
"b": 376.302,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0.965 0.969",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.717,
"t": 367.928,
"r": 347.709,
"b": 376.302,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "0.934 0.927",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 363.676,
"t": 367.928,
"r": 384.668,
"b": 376.302,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0.955 0.955",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 397.27,
"t": 366.637,
"r": 416.131,
"b": 376.774,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "0.88 0.857",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 439.527,
"t": 366.637,
"r": 458.388,
"b": 376.774,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "2.73 5.39",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 161.906,
"t": 399.709,
"r": 166.515,
"b": 408.083,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.509,
"t": 399.709,
"r": 214.118,
"b": 408.083,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 246.71,
"t": 394.23,
"r": 271.409,
"b": 402.604,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "OTSL HTML",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 289.017,
"t": 394.23,
"r": 310.009,
"b": 402.604,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0.938 0.952",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.717,
"t": 394.23,
"r": 347.709,
"b": 402.604,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "0.904 0.909",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 363.676,
"t": 394.23,
"r": 384.668,
"b": 402.604,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0.927 0.938",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.618,
"t": 392.939,
"r": 418.782,
"b": 403.076,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "0.853 0.843",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 439.527,
"t": 392.939,
"r": 458.388,
"b": 403.076,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "1.97 3.77",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 161.906,
"t": 426.01,
"r": 166.515,
"b": 434.384,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.509,
"t": 426.01,
"r": 214.118,
"b": 434.384,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 246.71,
"t": 420.531,
"r": 271.409,
"b": 428.905,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "OTSL HTML",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 289.017,
"t": 420.531,
"r": 310.009,
"b": 428.905,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0.923 0.945",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.717,
"t": 420.531,
"r": 347.709,
"b": 428.905,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "0.897 0.901",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 363.676,
"t": 420.531,
"r": 384.668,
"b": 428.905,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0.915 0.931",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.618,
"t": 419.24,
"r": 418.782,
"b": 429.377,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "0.859 0.834",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 439.527,
"t": 419.24,
"r": 458.388,
"b": 429.377,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "1.91 3.81",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 161.906,
"t": 452.312,
"r": 166.515,
"b": 460.686,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.509,
"t": 452.312,
"r": 214.118,
"b": 460.686,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 246.71,
"t": 446.832,
"r": 271.409,
"b": 455.206,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "OTSL HTML",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 289.017,
"t": 446.832,
"r": 310.009,
"b": 455.206,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0.952 0.944",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 329.021,
"t": 446.832,
"r": 345.406,
"b": 455.206,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "0.92 0.903",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 362.088,
"t": 445.541,
"r": 386.252,
"b": 455.678,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0.942 0.931",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.618,
"t": 445.541,
"r": 418.782,
"b": 455.678,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "0.857 0.824",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 439.527,
"t": 445.541,
"r": 458.388,
"b": 455.678,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "1.22 2",
"column_header": false,
"row_header": false,
"row_section": false
}
],
"num_rows": 6,
"num_cols": 8,
"grid": [
[
{
"bbox": {
"l": 160.37,
"t": 341.627,
"r": 168.045,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 2,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "# enc-layers",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.974,
"t": 341.627,
"r": 215.649,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 2,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "# dec-layers",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 239.798,
"t": 347.106,
"r": 278.333,
"b": 355.48,
"coord_origin": "TOPLEFT"
},
"row_span": 2,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Language",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 324.67,
"t": 341.627,
"r": 348.263,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 3,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 6,
"text": "TEDs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 324.67,
"t": 341.627,
"r": 348.263,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 3,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 6,
"text": "TEDs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 324.67,
"t": 341.627,
"r": 348.263,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 3,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 3,
"end_col_offset_idx": 6,
"text": "TEDs",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 396.271,
"t": 341.627,
"r": 417.123,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "mAP",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 430.771,
"t": 341.627,
"r": 467.141,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 1,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "Inference",
"column_header": true,
"row_header": false,
"row_section": false
}
],
[
{
"bbox": {
"l": 160.37,
"t": 341.627,
"r": 168.045,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 2,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 2,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "# enc-layers",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 207.974,
"t": 341.627,
"r": 215.649,
"b": 350.001,
"coord_origin": "TOPLEFT"
},
"row_span": 2,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 2,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "# dec-layers",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 239.798,
"t": 347.106,
"r": 278.333,
"b": 355.48,
"coord_origin": "TOPLEFT"
},
"row_span": 2,
"col_span": 1,
"start_row_offset_idx": 0,
"end_row_offset_idx": 2,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "Language",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 286.686,
"t": 354.578,
"r": 312.325,
"b": 362.952,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "simple",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 320.702,
"t": 354.578,
"r": 353.718,
"b": 362.952,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "complex",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 369.306,
"t": 354.578,
"r": 379.031,
"b": 362.952,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "all",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.927,
"t": 352.586,
"r": 418.473,
"b": 360.96,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "(0.75)",
"column_header": true,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 427.148,
"t": 352.586,
"r": 445.07,
"b": 360.96,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 1,
"end_row_offset_idx": 2,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "time (secs)",
"column_header": true,
"row_header": false,
"row_section": false
}
],
[
{
"bbox": {
"l": 161.906,
"t": 373.408,
"r": 166.515,
"b": 381.782,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.509,
"t": 373.408,
"r": 214.118,
"b": 381.782,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "6",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 246.71,
"t": 367.928,
"r": 271.409,
"b": 376.302,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "OTSL HTML",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 289.017,
"t": 367.928,
"r": 310.009,
"b": 376.302,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0.965 0.969",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.717,
"t": 367.928,
"r": 347.709,
"b": 376.302,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "0.934 0.927",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 363.676,
"t": 367.928,
"r": 384.668,
"b": 376.302,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0.955 0.955",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 397.27,
"t": 366.637,
"r": 416.131,
"b": 376.774,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "0.88 0.857",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 439.527,
"t": 366.637,
"r": 458.388,
"b": 376.774,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 2,
"end_row_offset_idx": 3,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "2.73 5.39",
"column_header": false,
"row_header": false,
"row_section": false
}
],
[
{
"bbox": {
"l": 161.906,
"t": 399.709,
"r": 166.515,
"b": 408.083,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.509,
"t": 399.709,
"r": 214.118,
"b": 408.083,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 246.71,
"t": 394.23,
"r": 271.409,
"b": 402.604,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "OTSL HTML",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 289.017,
"t": 394.23,
"r": 310.009,
"b": 402.604,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0.938 0.952",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.717,
"t": 394.23,
"r": 347.709,
"b": 402.604,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "0.904 0.909",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 363.676,
"t": 394.23,
"r": 384.668,
"b": 402.604,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0.927 0.938",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.618,
"t": 392.939,
"r": 418.782,
"b": 403.076,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "0.853 0.843",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 439.527,
"t": 392.939,
"r": 458.388,
"b": 403.076,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 3,
"end_row_offset_idx": 4,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "1.97 3.77",
"column_header": false,
"row_header": false,
"row_section": false
}
],
[
{
"bbox": {
"l": 161.906,
"t": 426.01,
"r": 166.515,
"b": 434.384,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.509,
"t": 426.01,
"r": 214.118,
"b": 434.384,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 246.71,
"t": 420.531,
"r": 271.409,
"b": 428.905,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "OTSL HTML",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 289.017,
"t": 420.531,
"r": 310.009,
"b": 428.905,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0.923 0.945",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 326.717,
"t": 420.531,
"r": 347.709,
"b": 428.905,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "0.897 0.901",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 363.676,
"t": 420.531,
"r": 384.668,
"b": 428.905,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0.915 0.931",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.618,
"t": 419.24,
"r": 418.782,
"b": 429.377,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "0.859 0.834",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 439.527,
"t": 419.24,
"r": 458.388,
"b": 429.377,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 4,
"end_row_offset_idx": 5,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "1.91 3.81",
"column_header": false,
"row_header": false,
"row_section": false
}
],
[
{
"bbox": {
"l": 161.906,
"t": 452.312,
"r": 166.515,
"b": 460.686,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 0,
"end_col_offset_idx": 1,
"text": "4",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 209.509,
"t": 452.312,
"r": 214.118,
"b": 460.686,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 1,
"end_col_offset_idx": 2,
"text": "2",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 246.71,
"t": 446.832,
"r": 271.409,
"b": 455.206,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 2,
"end_col_offset_idx": 3,
"text": "OTSL HTML",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 289.017,
"t": 446.832,
"r": 310.009,
"b": 455.206,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 3,
"end_col_offset_idx": 4,
"text": "0.952 0.944",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 329.021,
"t": 446.832,
"r": 345.406,
"b": 455.206,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 4,
"end_col_offset_idx": 5,
"text": "0.92 0.903",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 362.088,
"t": 445.541,
"r": 386.252,
"b": 455.678,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 5,
"end_col_offset_idx": 6,
"text": "0.942 0.931",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 394.618,
"t": 445.541,
"r": 418.782,
"b": 455.678,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 6,
"end_col_offset_idx": 7,
"text": "0.857 0.824",
"column_header": false,
"row_header": false,
"row_section": false
},
{
"bbox": {
"l": 439.527,
"t": 445.541,
"r": 458.388,
"b": 455.678,
"coord_origin": "TOPLEFT"
},
"row_span": 1,
"col_span": 1,
"start_row_offset_idx": 5,
"end_row_offset_idx": 6,
"start_col_offset_idx": 7,
"end_col_offset_idx": 8,
"text": "1.22 2",
"column_header": false,
"row_header": false,
"row_section": false
}
]
]
}
}
],
"key_value_items": [],
"form_items": [],
"pages": {
"1": {
"size": {
"width": 612.0,
"height": 792.0
},
"image": null,
"page_no": 1
}
}
}