docling/tests/data/groundtruth/docling_v1/2305.03393v1-pg9.pages.json
Christoph Auer e00f362405
Some checks failed
Run Docs CI / build-docs (push) Failing after 1m26s
Run CI / code-checks (push) Failing after 6m37s
Update tests, use TextCell.from_ocr property
Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
2025-03-13 16:04:08 +01:00

1 line
65 KiB
JSON

[{"page_no": 0, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.03700000000003, "r_x1": 447.545, "r_y1": 102.03700000000003, "r_x2": 447.545, "r_y2": 93.66300000000001, "r_x3": 194.478, "r_y3": 93.66300000000001, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.03700000000003, "r_x1": 480.593, "r_y1": 102.03700000000003, "r_x2": 480.593, "r_y2": 93.66300000000001, "r_x3": 475.984, "r_y3": 93.66300000000001, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.16999999999996, "r_x1": 480.591, "r_y1": 128.16999999999996, "r_x2": 480.591, "r_y2": 118.87400000000002, "r_x3": 134.765, "r_y3": 118.87400000000002, "coord_origin": "TOPLEFT"}, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 140.125, "r_x1": 480.597, "r_y1": 140.125, "r_x2": 480.597, "r_y2": 130.82899999999995, "r_x3": 134.765, "r_y3": 130.82899999999995, "coord_origin": "TOPLEFT"}, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 152.08100000000002, "r_x1": 210.788, "r_y1": 152.08100000000002, "r_x2": 210.788, "r_y2": 142.78499999999997, "r_x3": 134.765, "r_y3": 142.78499999999997, "coord_origin": "TOPLEFT"}, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 178.38300000000004, "r_x1": 149.403, "r_y1": 178.38300000000004, "r_x2": 149.403, "r_y2": 169.15599999999995, "r_x3": 134.765, "r_y3": 169.15599999999995, "coord_origin": "TOPLEFT"}, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 178.38300000000004, "r_x1": 318.451, "r_y1": 178.38300000000004, "r_x2": 318.451, "r_y2": 169.15599999999995, "r_x3": 160.859, "r_y3": 169.15599999999995, "coord_origin": "TOPLEFT"}, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 194.822, "r_x1": 480.582, "r_y1": 194.822, "r_x2": 480.582, "r_y2": 185.52599999999995, "r_x3": 134.765, "r_y3": 185.52599999999995, "coord_origin": "TOPLEFT"}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 206.77700000000004, "r_x1": 480.588, "r_y1": 206.77700000000004, "r_x2": 480.588, "r_y2": 197.481, "r_x3": 134.765, "r_y3": 197.481, "coord_origin": "TOPLEFT"}, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 218.73199999999997, "r_x1": 480.589, "r_y1": 218.73199999999997, "r_x2": 480.589, "r_y2": 209.43600000000004, "r_x3": 134.765, "r_y3": 209.43600000000004, "coord_origin": "TOPLEFT"}, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 230.687, "r_x1": 480.596, "r_y1": 230.687, "r_x2": 480.596, "r_y2": 221.39099999999996, "r_x3": 134.765, "r_y3": 221.39099999999996, "coord_origin": "TOPLEFT"}, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 242.64200000000005, "r_x1": 440.943, "r_y1": 242.64200000000005, "r_x2": 440.943, "r_y2": 233.346, "r_x3": 134.765, "r_y3": 233.346, "coord_origin": "TOPLEFT"}, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.868, "r_y0": 243.111, "r_x1": 480.588, "r_y1": 243.111, "r_x2": 480.588, "r_y2": 232.02099999999996, "r_x3": 444.868, "r_y3": 232.02099999999996, "coord_origin": "TOPLEFT"}, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 255.067, "r_x1": 145.201, "r_y1": 255.067, "r_x2": 145.201, "r_y2": 243.97699999999998, "r_x3": 134.765, "r_y3": 243.97699999999998, "coord_origin": "TOPLEFT"}, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.149, "r_y0": 254.59799999999996, "r_x1": 311.223, "r_y1": 254.59799999999996, "r_x2": 311.223, "r_y2": 245.30200000000002, "r_x3": 149.149, "r_y3": 245.30200000000002, "coord_origin": "TOPLEFT"}, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.873, "r_x1": 160.118, "r_y1": 283.873, "r_x2": 160.118, "r_y2": 273.736, "r_x3": 134.765, "r_y3": 273.736, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.344, "r_y0": 283.873, "r_x1": 175.602, "r_y1": 283.873, "r_x2": 175.602, "r_y2": 273.736, "r_x3": 167.344, "r_y3": 273.736, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.133, "r_y0": 283.401, "r_x1": 255.735, "r_y1": 283.401, "r_x2": 255.735, "r_y2": 275.02700000000004, "r_x3": 188.133, "r_y3": 275.02700000000004, "coord_origin": "TOPLEFT"}, "text": "HPO performed", "orig": "HPO performed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.007, "r_y0": 283.401, "r_x1": 269.687, "r_y1": 283.401, "r_x2": 269.687, "r_y2": 275.02700000000004, "r_x3": 262.007, "r_y3": 275.02700000000004, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.95, "r_y0": 283.401, "r_x1": 300.648, "r_y1": 283.401, "r_x2": 300.648, "r_y2": 275.02700000000004, "r_x3": 275.95, "r_y3": 275.02700000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.92, "r_y0": 283.401, "r_x1": 321.759, "r_y1": 283.401, "r_x2": 321.759, "r_y2": 275.02700000000004, "r_x3": 306.92, "r_y3": 275.02700000000004, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.022, "r_y0": 283.401, "r_x1": 419.233, "r_y1": 283.401, "r_x2": 419.233, "r_y2": 275.02700000000004, "r_x3": 328.022, "r_y3": 275.02700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML representation", "orig": "HTML representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.496, "r_y0": 283.401, "r_x1": 435.22, "r_y1": 283.401, "r_x2": 435.22, "r_y2": 275.02700000000004, "r_x3": 425.496, "r_y3": 275.02700000000004, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.492, "r_y0": 283.401, "r_x1": 454.287, "r_y1": 283.401, "r_x2": 454.287, "r_y2": 275.02700000000004, "r_x3": 441.492, "r_y3": 275.02700000000004, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.559, "r_y0": 283.401, "r_x1": 480.577, "r_y1": 283.401, "r_x2": 480.577, "r_y2": 275.02700000000004, "r_x3": 460.559, "r_y3": 275.02700000000004, "coord_origin": "TOPLEFT"}, "text": "same", "orig": "same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 294.36, "r_x1": 480.599, "r_y1": 294.36, "r_x2": 480.599, "r_y2": 285.986, "r_x3": 134.765, "r_y3": 285.986, "coord_origin": "TOPLEFT"}, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 305.319, "r_x1": 480.599, "r_y1": 305.319, "r_x2": 480.599, "r_y2": 296.945, "r_x3": 134.765, "r_y3": 296.945, "coord_origin": "TOPLEFT"}, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 316.278, "r_x1": 163.505, "r_y1": 316.278, "r_x2": 163.505, "r_y2": 307.904, "r_x3": 134.765, "r_y3": 307.904, "coord_origin": "TOPLEFT"}, "text": "smaller", "orig": "smaller", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.817, "r_y0": 316.278, "r_x1": 443.266, "r_y1": 316.278, "r_x2": 443.266, "r_y2": 307.904, "r_x3": 167.817, "r_y3": 307.904, "coord_origin": "TOPLEFT"}, "text": "models trained on OTSL perform better, especially in recognizing", "orig": "models trained on OTSL perform better, especially in recognizing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.577, "r_y0": 316.278, "r_x1": 480.592, "r_y1": 316.278, "r_x2": 480.592, "r_y2": 307.904, "r_x3": 447.577, "r_y3": 307.904, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 327.237, "r_x1": 480.588, "r_y1": 327.237, "r_x2": 480.588, "r_y2": 318.863, "r_x3": 134.765, "r_y3": 318.863, "coord_origin": "TOPLEFT"}, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.001, "r_x1": 168.045, "r_y1": 350.001, "r_x2": 168.045, "r_y2": 341.627, "r_x3": 160.37, "r_y3": 341.627, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 362.952, "r_x1": 183.828, "r_y1": 362.952, "r_x2": 183.828, "r_y2": 354.578, "r_x3": 144.592, "r_y3": 354.578, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.001, "r_x1": 215.649, "r_y1": 350.001, "r_x2": 215.649, "r_y2": 341.627, "r_x3": 207.974, "r_y3": 341.627, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 362.952, "r_x1": 231.425, "r_y1": 362.952, "r_x2": 231.425, "r_y2": 354.578, "r_x3": 192.195, "r_y3": 354.578, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 355.48, "r_x1": 278.333, "r_y1": 355.48, "r_x2": 278.333, "r_y2": 347.106, "r_x3": 239.798, "r_y3": 347.106, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.001, "r_x1": 348.263, "r_y1": 350.001, "r_x2": 348.263, "r_y2": 341.627, "r_x3": 324.67, "r_y3": 341.627, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.001, "r_x1": 417.123, "r_y1": 350.001, "r_x2": 417.123, "r_y2": 341.627, "r_x3": 396.271, "r_y3": 341.627, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 360.96, "r_x1": 418.473, "r_y1": 360.96, "r_x2": 418.473, "r_y2": 352.586, "r_x3": 394.927, "r_y3": 352.586, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.001, "r_x1": 467.141, "r_y1": 350.001, "r_x2": 467.141, "r_y2": 341.627, "r_x3": 430.771, "r_y3": 341.627, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 360.96, "r_x1": 470.773, "r_y1": 360.96, "r_x2": 470.773, "r_y2": 352.586, "r_x3": 427.148, "r_y3": 352.586, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 362.952, "r_x1": 312.325, "r_y1": 362.952, "r_x2": 312.325, "r_y2": 354.578, "r_x3": 286.686, "r_y3": 354.578, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 362.952, "r_x1": 353.718, "r_y1": 362.952, "r_x2": 353.718, "r_y2": 354.578, "r_x3": 320.702, "r_y3": 354.578, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 362.952, "r_x1": 379.031, "r_y1": 362.952, "r_x2": 379.031, "r_y2": 354.578, "r_x3": 369.306, "r_y3": 354.578, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 381.782, "r_x1": 166.515, "r_y1": 381.782, "r_x2": 166.515, "r_y2": 373.408, "r_x3": 161.906, "r_y3": 373.408, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 381.782, "r_x1": 214.118, "r_y1": 381.782, "r_x2": 214.118, "r_y2": 373.408, "r_x3": 209.509, "r_y3": 373.408, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 376.302, "r_x1": 271.409, "r_y1": 376.302, "r_x2": 271.409, "r_y2": 367.928, "r_x3": 246.71, "r_y3": 367.928, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 376.302, "r_x1": 310.009, "r_y1": 376.302, "r_x2": 310.009, "r_y2": 367.928, "r_x3": 289.017, "r_y3": 367.928, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 376.302, "r_x1": 347.709, "r_y1": 376.302, "r_x2": 347.709, "r_y2": 367.928, "r_x3": 326.717, "r_y3": 367.928, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 376.302, "r_x1": 384.668, "r_y1": 376.302, "r_x2": 384.668, "r_y2": 367.928, "r_x3": 363.676, "r_y3": 367.928, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 376.774, "r_x1": 416.131, "r_y1": 376.774, "r_x2": 416.131, "r_y2": 366.637, "r_x3": 397.27, "r_y3": 366.637, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 376.774, "r_x1": 458.388, "r_y1": 376.774, "r_x2": 458.388, "r_y2": 366.637, "r_x3": 439.527, "r_y3": 366.637, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.254, "r_x1": 272.94, "r_y1": 389.254, "r_x2": 272.94, "r_y2": 380.88, "r_x3": 245.176, "r_y3": 380.88, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.254, "r_x1": 310.009, "r_y1": 389.254, "r_x2": 310.009, "r_y2": 380.88, "r_x3": 289.017, "r_y3": 380.88, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.254, "r_x1": 347.709, "r_y1": 389.254, "r_x2": 347.709, "r_y2": 380.88, "r_x3": 326.717, "r_y3": 380.88, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.254, "r_x1": 384.668, "r_y1": 389.254, "r_x2": 384.668, "r_y2": 380.88, "r_x3": 363.676, "r_y3": 380.88, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.254, "r_x1": 417.198, "r_y1": 389.254, "r_x2": 417.198, "r_y2": 380.88, "r_x3": 396.206, "r_y3": 380.88, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.254, "r_x1": 457.152, "r_y1": 389.254, "r_x2": 457.152, "r_y2": 380.88, "r_x3": 440.767, "r_y3": 380.88, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.083, "r_x1": 166.515, "r_y1": 408.083, "r_x2": 166.515, "r_y2": 399.709, "r_x3": 161.906, "r_y3": 399.709, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.083, "r_x1": 214.118, "r_y1": 408.083, "r_x2": 214.118, "r_y2": 399.709, "r_x3": 209.509, "r_y3": 399.709, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 402.604, "r_x1": 271.409, "r_y1": 402.604, "r_x2": 271.409, "r_y2": 394.23, "r_x3": 246.71, "r_y3": 394.23, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 402.604, "r_x1": 310.009, "r_y1": 402.604, "r_x2": 310.009, "r_y2": 394.23, "r_x3": 289.017, "r_y3": 394.23, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 402.604, "r_x1": 347.709, "r_y1": 402.604, "r_x2": 347.709, "r_y2": 394.23, "r_x3": 326.717, "r_y3": 394.23, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 402.604, "r_x1": 384.668, "r_y1": 402.604, "r_x2": 384.668, "r_y2": 394.23, "r_x3": 363.676, "r_y3": 394.23, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 403.076, "r_x1": 418.782, "r_y1": 403.076, "r_x2": 418.782, "r_y2": 392.939, "r_x3": 394.618, "r_y3": 392.939, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 403.076, "r_x1": 458.388, "r_y1": 403.076, "r_x2": 458.388, "r_y2": 392.939, "r_x3": 439.527, "r_y3": 392.939, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 415.555, "r_x1": 272.94, "r_y1": 415.555, "r_x2": 272.94, "r_y2": 407.181, "r_x3": 245.176, "r_y3": 407.181, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 415.555, "r_x1": 310.009, "r_y1": 415.555, "r_x2": 310.009, "r_y2": 407.181, "r_x3": 289.017, "r_y3": 407.181, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 415.555, "r_x1": 347.709, "r_y1": 415.555, "r_x2": 347.709, "r_y2": 407.181, "r_x3": 326.717, "r_y3": 407.181, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 416.027, "r_x1": 386.252, "r_y1": 416.027, "r_x2": 386.252, "r_y2": 405.89, "r_x3": 362.088, "r_y3": 405.89, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 415.555, "r_x1": 417.198, "r_y1": 415.555, "r_x2": 417.198, "r_y2": 407.181, "r_x3": 396.206, "r_y3": 407.181, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 415.555, "r_x1": 457.152, "r_y1": 415.555, "r_x2": 457.152, "r_y2": 407.181, "r_x3": 440.767, "r_y3": 407.181, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 434.384, "r_x1": 166.515, "r_y1": 434.384, "r_x2": 166.515, "r_y2": 426.01, "r_x3": 161.906, "r_y3": 426.01, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 434.384, "r_x1": 214.118, "r_y1": 434.384, "r_x2": 214.118, "r_y2": 426.01, "r_x3": 209.509, "r_y3": 426.01, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 428.905, "r_x1": 271.409, "r_y1": 428.905, "r_x2": 271.409, "r_y2": 420.531, "r_x3": 246.71, "r_y3": 420.531, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 428.905, "r_x1": 310.009, "r_y1": 428.905, "r_x2": 310.009, "r_y2": 420.531, "r_x3": 289.017, "r_y3": 420.531, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 428.905, "r_x1": 347.709, "r_y1": 428.905, "r_x2": 347.709, "r_y2": 420.531, "r_x3": 326.717, "r_y3": 420.531, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 428.905, "r_x1": 384.668, "r_y1": 428.905, "r_x2": 384.668, "r_y2": 420.531, "r_x3": 363.676, "r_y3": 420.531, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 429.377, "r_x1": 418.782, "r_y1": 429.377, "r_x2": 418.782, "r_y2": 419.24, "r_x3": 394.618, "r_y3": 419.24, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 429.377, "r_x1": 458.388, "r_y1": 429.377, "r_x2": 458.388, "r_y2": 419.24, "r_x3": 439.527, "r_y3": 419.24, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 441.856, "r_x1": 272.94, "r_y1": 441.856, "r_x2": 272.94, "r_y2": 433.482, "r_x3": 245.176, "r_y3": 433.482, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 441.856, "r_x1": 310.009, "r_y1": 441.856, "r_x2": 310.009, "r_y2": 433.482, "r_x3": 289.017, "r_y3": 433.482, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 441.856, "r_x1": 347.709, "r_y1": 441.856, "r_x2": 347.709, "r_y2": 433.482, "r_x3": 326.717, "r_y3": 433.482, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 442.328, "r_x1": 386.252, "r_y1": 442.328, "r_x2": 386.252, "r_y2": 432.191, "r_x3": 362.088, "r_y3": 432.191, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 441.856, "r_x1": 417.198, "r_y1": 441.856, "r_x2": 417.198, "r_y2": 433.482, "r_x3": 396.206, "r_y3": 433.482, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 441.856, "r_x1": 457.152, "r_y1": 441.856, "r_x2": 457.152, "r_y2": 433.482, "r_x3": 440.767, "r_y3": 433.482, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 460.686, "r_x1": 166.515, "r_y1": 460.686, "r_x2": 166.515, "r_y2": 452.312, "r_x3": 161.906, "r_y3": 452.312, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 460.686, "r_x1": 214.118, "r_y1": 460.686, "r_x2": 214.118, "r_y2": 452.312, "r_x3": 209.509, "r_y3": 452.312, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.206, "r_x1": 271.409, "r_y1": 455.206, "r_x2": 271.409, "r_y2": 446.832, "r_x3": 246.71, "r_y3": 446.832, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.206, "r_x1": 310.009, "r_y1": 455.206, "r_x2": 310.009, "r_y2": 446.832, "r_x3": 289.017, "r_y3": 446.832, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.206, "r_x1": 345.406, "r_y1": 455.206, "r_x2": 345.406, "r_y2": 446.832, "r_x3": 329.021, "r_y3": 446.832, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 455.678, "r_x1": 386.252, "r_y1": 455.678, "r_x2": 386.252, "r_y2": 445.541, "r_x3": 362.088, "r_y3": 445.541, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 455.678, "r_x1": 418.782, "r_y1": 455.678, "r_x2": 418.782, "r_y2": 445.541, "r_x3": 394.618, "r_y3": 445.541, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 455.678, "r_x1": 458.388, "r_y1": 455.678, "r_x2": 458.388, "r_y2": 445.541, "r_x3": 439.527, "r_y3": 445.541, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.158, "r_x1": 272.94, "r_y1": 468.158, "r_x2": 272.94, "r_y2": 459.784, "r_x3": 245.176, "r_y3": 459.784, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.158, "r_x1": 310.009, "r_y1": 468.158, "r_x2": 310.009, "r_y2": 459.784, "r_x3": 289.017, "r_y3": 459.784, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.158, "r_x1": 347.709, "r_y1": 468.158, "r_x2": 347.709, "r_y2": 459.784, "r_x3": 326.717, "r_y3": 459.784, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.158, "r_x1": 384.668, "r_y1": 468.158, "r_x2": 384.668, "r_y2": 459.784, "r_x3": 363.676, "r_y3": 459.784, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.158, "r_x1": 417.198, "r_y1": 468.158, "r_x2": 417.198, "r_y2": 459.784, "r_x3": 396.206, "r_y3": 459.784, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.158, "r_x1": 451.262, "r_y1": 468.158, "r_x2": 451.262, "r_y2": 459.784, "r_x3": 446.653, "r_y3": 459.784, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 517.3489999999999, "r_x1": 149.403, "r_y1": 517.3489999999999, "r_x2": 149.403, "r_y2": 508.122, "r_x3": 134.765, "r_y3": 508.122, "coord_origin": "TOPLEFT"}, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 517.3489999999999, "r_x1": 264.408, "r_y1": 517.3489999999999, "r_x2": 264.408, "r_y2": 508.122, "r_x3": 160.859, "r_y3": 508.122, "coord_origin": "TOPLEFT"}, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.787, "r_x1": 480.562, "r_y1": 533.787, "r_x2": 480.562, "r_y2": 524.491, "r_x3": 134.765, "r_y3": 524.491, "coord_origin": "TOPLEFT"}, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.7429999999999, "r_x1": 164.924, "r_y1": 545.7429999999999, "r_x2": 164.924, "r_y2": 536.447, "r_x3": 134.765, "r_y3": 536.447, "coord_origin": "TOPLEFT"}, "text": "quality", "orig": "quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.324, "r_y0": 545.7429999999999, "r_x1": 480.59, "r_y1": 545.7429999999999, "r_x2": 480.59, "r_y2": 536.447, "r_x3": 169.324, "r_y3": 536.447, "coord_origin": "TOPLEFT"}, "text": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.698, "r_x1": 480.722, "r_y1": 557.698, "r_x2": 480.722, "r_y2": 548.402, "r_x3": 134.765, "r_y3": 548.402, "coord_origin": "TOPLEFT"}, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.653, "r_x1": 480.603, "r_y1": 569.653, "r_x2": 480.603, "r_y2": 560.357, "r_x3": 134.765, "r_y3": 560.357, "coord_origin": "TOPLEFT"}, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.608, "r_x1": 480.594, "r_y1": 581.608, "r_x2": 480.594, "r_y2": 572.312, "r_x3": 134.765, "r_y3": 572.312, "coord_origin": "TOPLEFT"}, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.563, "r_x1": 480.592, "r_y1": 593.563, "r_x2": 480.592, "r_y2": 584.267, "r_x3": 134.765, "r_y3": 584.267, "coord_origin": "TOPLEFT"}, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.519, "r_x1": 237.316, "r_y1": 605.519, "r_x2": 237.316, "r_y2": 596.223, "r_x3": 134.765, "r_y3": 596.223, "coord_origin": "TOPLEFT"}, "text": "mAP scores even on di", "orig": "mAP scores even on di", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.317, "r_y0": 605.519, "r_x1": 245.616, "r_y1": 605.519, "r_x2": 245.616, "r_y2": 596.223, "r_x3": 237.317, "r_y3": 596.223, "coord_origin": "TOPLEFT"}, "text": "ffi", "orig": "ffi", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.617, "r_y0": 605.519, "r_x1": 480.58, "r_y1": 605.519, "r_x2": 480.58, "r_y2": 596.223, "r_x3": 245.617, "r_y3": 596.223, "coord_origin": "TOPLEFT"}, "text": "cult financial tables (FinTabNet) that contain sparse", "orig": "cult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.4739999999999, "r_x1": 206.801, "r_y1": 617.4739999999999, "r_x2": 206.801, "r_y2": 608.178, "r_x3": 134.765, "r_y3": 608.178, "coord_origin": "TOPLEFT"}, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 629.429, "r_x1": 205.6, "r_y1": 629.429, "r_x2": 205.6, "r_y2": 620.133, "r_x3": 149.709, "r_y3": 620.133, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.578, "r_y0": 629.429, "r_x1": 224.409, "r_y1": 629.429, "r_x2": 224.409, "r_y2": 620.133, "r_x3": 210.578, "r_y3": 620.133, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.383, "r_y0": 629.429, "r_x1": 257.737, "r_y1": 629.429, "r_x2": 257.737, "r_y2": 620.133, "r_x3": 229.383, "r_y3": 620.133, "coord_origin": "TOPLEFT"}, "text": "results", "orig": "results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.722, "r_y0": 629.429, "r_x1": 307.321, "r_y1": 629.429, "r_x2": 307.321, "r_y2": 620.133, "r_x3": 262.722, "r_y3": 620.133, "coord_origin": "TOPLEFT"}, "text": "show that", "orig": "show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.301, "r_y0": 629.429, "r_x1": 480.595, "r_y1": 629.429, "r_x2": 480.595, "r_y2": 620.133, "r_x3": 312.301, "r_y3": 620.133, "coord_origin": "TOPLEFT"}, "text": "OTSL has an advantage over HTML", "orig": "OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 641.384, "r_x1": 480.599, "r_y1": 641.384, "r_x2": 480.599, "r_y2": 632.088, "r_x3": 134.765, "r_y3": 632.088, "coord_origin": "TOPLEFT"}, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 653.3389999999999, "r_x1": 480.594, "r_y1": 653.3389999999999, "r_x2": 480.594, "r_y2": 644.043, "r_x3": 134.765, "r_y3": 644.043, "coord_origin": "TOPLEFT"}, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 665.294, "r_x1": 405.8, "r_y1": 665.294, "r_x2": 405.8, "r_y2": 655.998, "r_x3": 134.765, "r_y3": 655.998, "coord_origin": "TOPLEFT"}, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 8, "label": "page_header", "bbox": {"l": 194.478, "t": 93.66300000000001, "r": 447.545, "b": 102.03700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9373534917831421, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.03700000000003, "r_x1": 447.545, "r_y1": 102.03700000000003, "r_x2": 447.545, "r_y2": 93.66300000000001, "r_x3": 194.478, "r_y3": 93.66300000000001, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "page_header", "bbox": {"l": 475.984, "t": 93.66300000000001, "r": 480.593, "b": 102.03700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.8858680725097656, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.03700000000003, "r_x1": 480.593, "r_y1": 102.03700000000003, "r_x2": 480.593, "r_y2": 93.66300000000001, "r_x3": 475.984, "r_y3": 93.66300000000001, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 118.87400000000002, "r": 480.591, "b": 128.16999999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9806433916091919, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.16999999999996, "r_x1": 480.591, "r_y1": 128.16999999999996, "r_x2": 480.591, "r_y2": 118.87400000000002, "r_x3": 134.765, "r_y3": 118.87400000000002, "coord_origin": "TOPLEFT"}, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "section_header", "bbox": {"l": 134.765, "t": 169.15599999999995, "r": 149.403, "b": 178.38300000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9577404260635376, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 178.38300000000004, "r_x1": 149.403, "r_y1": 178.38300000000004, "r_x2": 149.403, "r_y2": 169.15599999999995, "r_x3": 134.765, "r_y3": 169.15599999999995, "coord_origin": "TOPLEFT"}, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 185.52599999999995, "r": 480.582, "b": 194.822, "coord_origin": "TOPLEFT"}, "confidence": 0.98504239320755, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 194.822, "r_x1": 480.582, "r_y1": 194.822, "r_x2": 480.582, "r_y2": 185.52599999999995, "r_x3": 134.765, "r_y3": 185.52599999999995, "coord_origin": "TOPLEFT"}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "caption", "bbox": {"l": 134.765, "t": 273.736, "r": 160.118, "b": 283.873, "coord_origin": "TOPLEFT"}, "confidence": 0.9591909050941467, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.873, "r_x1": 160.118, "r_y1": 283.873, "r_x2": 160.118, "r_y2": 273.736, "r_x3": 134.765, "r_y3": 273.736, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "section_header", "bbox": {"l": 134.765, "t": 508.122, "r": 149.403, "b": 517.3489999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9589294195175171, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 517.3489999999999, "r_x1": 149.403, "r_y1": 517.3489999999999, "r_x2": 149.403, "r_y2": 508.122, "r_x3": 134.765, "r_y3": 508.122, "coord_origin": "TOPLEFT"}, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 524.491, "r": 480.562, "b": 533.787, "coord_origin": "TOPLEFT"}, "confidence": 0.9849975109100342, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.787, "r_x1": 480.562, "r_y1": 533.787, "r_x2": 480.562, "r_y2": 524.491, "r_x3": 134.765, "r_y3": 524.491, "coord_origin": "TOPLEFT"}, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 149.709, "t": 620.133, "r": 205.6, "b": 629.429, "coord_origin": "TOPLEFT"}, "confidence": 0.9850137829780579, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 629.429, "r_x1": 205.6, "r_y1": 629.429, "r_x2": 205.6, "r_y2": 620.133, "r_x3": 149.709, "r_y3": 620.133, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "table", "bbox": {"l": 139.66741943359375, "t": 337.54541015625, "r": 475.00927734375, "b": 469.4945373535156, "coord_origin": "TOPLEFT"}, "confidence": 0.9901031255722046, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"0": {"label": "table", "id": 0, "page_no": 0, "cluster": {"id": 0, "label": "table", "bbox": {"l": 139.66741943359375, "t": 337.54541015625, "r": 475.00927734375, "b": 469.4945373535156, "coord_origin": "TOPLEFT"}, "confidence": 0.9901031255722046, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 8, "page_no": 0, "cluster": {"id": 8, "label": "page_header", "bbox": {"l": 194.478, "t": 93.66300000000001, "r": 447.545, "b": 102.03700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9373534917831421, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.03700000000003, "r_x1": 447.545, "r_y1": 102.03700000000003, "r_x2": 447.545, "r_y2": 93.66300000000001, "r_x3": 194.478, "r_y3": 93.66300000000001, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 9, "page_no": 0, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 475.984, "t": 93.66300000000001, "r": 480.593, "b": 102.03700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.8858680725097656, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.03700000000003, "r_x1": 480.593, "r_y1": 102.03700000000003, "r_x2": 480.593, "r_y2": 93.66300000000001, "r_x3": 475.984, "r_y3": 93.66300000000001, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9"}, {"label": "text", "id": 4, "page_no": 0, "cluster": {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 118.87400000000002, "r": 480.591, "b": 128.16999999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9806433916091919, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.16999999999996, "r_x1": 480.591, "r_y1": 128.16999999999996, "r_x2": 480.591, "r_y2": 118.87400000000002, "r_x3": 134.765, "r_y3": 118.87400000000002, "coord_origin": "TOPLEFT"}, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "order to compute the TED score. Inference timing results for all experiments"}, {"label": "section_header", "id": 7, "page_no": 0, "cluster": {"id": 7, "label": "section_header", "bbox": {"l": 134.765, "t": 169.15599999999995, "r": 149.403, "b": 178.38300000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9577404260635376, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 178.38300000000004, "r_x1": 149.403, "r_y1": 178.38300000000004, "r_x2": 149.403, "r_y2": 169.15599999999995, "r_x3": 134.765, "r_y3": 169.15599999999995, "coord_origin": "TOPLEFT"}, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.1"}, {"label": "text", "id": 1, "page_no": 0, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 185.52599999999995, "r": 480.582, "b": 194.822, "coord_origin": "TOPLEFT"}, "confidence": 0.98504239320755, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 194.822, "r_x1": 480.582, "r_y1": 194.822, "r_x2": 480.582, "r_y2": 185.52599999999995, "r_x3": 134.765, "r_y3": 185.52599999999995, "coord_origin": "TOPLEFT"}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a"}, {"label": "caption", "id": 5, "page_no": 0, "cluster": {"id": 5, "label": "caption", "bbox": {"l": 134.765, "t": 273.736, "r": 160.118, "b": 283.873, "coord_origin": "TOPLEFT"}, "confidence": 0.9591909050941467, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.873, "r_x1": 160.118, "r_y1": 283.873, "r_x2": 160.118, "r_y2": 273.736, "r_x3": 134.765, "r_y3": 273.736, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table"}, {"label": "section_header", "id": 6, "page_no": 0, "cluster": {"id": 6, "label": "section_header", "bbox": {"l": 134.765, "t": 508.122, "r": 149.403, "b": 517.3489999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9589294195175171, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 517.3489999999999, "r_x1": 149.403, "r_y1": 517.3489999999999, "r_x2": 149.403, "r_y2": 508.122, "r_x3": 134.765, "r_y3": 508.122, "coord_origin": "TOPLEFT"}, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.2"}, {"label": "text", "id": 3, "page_no": 0, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 524.491, "r": 480.562, "b": 533.787, "coord_origin": "TOPLEFT"}, "confidence": 0.9849975109100342, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.787, "r_x1": 480.562, "r_y1": 533.787, "r_x2": 480.562, "r_y2": 524.491, "r_x3": 134.765, "r_y3": 524.491, "coord_origin": "TOPLEFT"}, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We picked the model parameter configuration that produced the best prediction"}, {"label": "text", "id": 2, "page_no": 0, "cluster": {"id": 2, "label": "text", "bbox": {"l": 149.709, "t": 620.133, "r": 205.6, "b": 629.429, "coord_origin": "TOPLEFT"}, "confidence": 0.9850137829780579, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 629.429, "r_x1": 205.6, "r_y1": 629.429, "r_x2": 205.6, "r_y2": 620.133, "r_x3": 149.709, "r_y3": 620.133, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Additionally,"}, {"label": "table", "id": 0, "page_no": 0, "cluster": {"id": 0, "label": "table", "bbox": {"l": 139.66741943359375, "t": 337.54541015625, "r": 475.00927734375, "b": 469.4945373535156, "coord_origin": "TOPLEFT"}, "confidence": 0.9901031255722046, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "body": [{"label": "text", "id": 4, "page_no": 0, "cluster": {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 118.87400000000002, "r": 480.591, "b": 128.16999999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9806433916091919, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.16999999999996, "r_x1": 480.591, "r_y1": 128.16999999999996, "r_x2": 480.591, "r_y2": 118.87400000000002, "r_x3": 134.765, "r_y3": 118.87400000000002, "coord_origin": "TOPLEFT"}, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "order to compute the TED score. Inference timing results for all experiments"}, {"label": "section_header", "id": 7, "page_no": 0, "cluster": {"id": 7, "label": "section_header", "bbox": {"l": 134.765, "t": 169.15599999999995, "r": 149.403, "b": 178.38300000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9577404260635376, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 178.38300000000004, "r_x1": 149.403, "r_y1": 178.38300000000004, "r_x2": 149.403, "r_y2": 169.15599999999995, "r_x3": 134.765, "r_y3": 169.15599999999995, "coord_origin": "TOPLEFT"}, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.1"}, {"label": "text", "id": 1, "page_no": 0, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 185.52599999999995, "r": 480.582, "b": 194.822, "coord_origin": "TOPLEFT"}, "confidence": 0.98504239320755, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 194.822, "r_x1": 480.582, "r_y1": 194.822, "r_x2": 480.582, "r_y2": 185.52599999999995, "r_x3": 134.765, "r_y3": 185.52599999999995, "coord_origin": "TOPLEFT"}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a"}, {"label": "caption", "id": 5, "page_no": 0, "cluster": {"id": 5, "label": "caption", "bbox": {"l": 134.765, "t": 273.736, "r": 160.118, "b": 283.873, "coord_origin": "TOPLEFT"}, "confidence": 0.9591909050941467, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.873, "r_x1": 160.118, "r_y1": 283.873, "r_x2": 160.118, "r_y2": 273.736, "r_x3": 134.765, "r_y3": 273.736, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table"}, {"label": "section_header", "id": 6, "page_no": 0, "cluster": {"id": 6, "label": "section_header", "bbox": {"l": 134.765, "t": 508.122, "r": 149.403, "b": 517.3489999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9589294195175171, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 517.3489999999999, "r_x1": 149.403, "r_y1": 517.3489999999999, "r_x2": 149.403, "r_y2": 508.122, "r_x3": 134.765, "r_y3": 508.122, "coord_origin": "TOPLEFT"}, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.2"}, {"label": "text", "id": 3, "page_no": 0, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 524.491, "r": 480.562, "b": 533.787, "coord_origin": "TOPLEFT"}, "confidence": 0.9849975109100342, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.787, "r_x1": 480.562, "r_y1": 533.787, "r_x2": 480.562, "r_y2": 524.491, "r_x3": 134.765, "r_y3": 524.491, "coord_origin": "TOPLEFT"}, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We picked the model parameter configuration that produced the best prediction"}, {"label": "text", "id": 2, "page_no": 0, "cluster": {"id": 2, "label": "text", "bbox": {"l": 149.709, "t": 620.133, "r": 205.6, "b": 629.429, "coord_origin": "TOPLEFT"}, "confidence": 0.9850137829780579, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 629.429, "r_x1": 205.6, "r_y1": 629.429, "r_x2": 205.6, "r_y2": 620.133, "r_x3": 149.709, "r_y3": 620.133, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Additionally,"}, {"label": "table", "id": 0, "page_no": 0, "cluster": {"id": 0, "label": "table", "bbox": {"l": 139.66741943359375, "t": 337.54541015625, "r": 475.00927734375, "b": 469.4945373535156, "coord_origin": "TOPLEFT"}, "confidence": 0.9901031255722046, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "headers": [{"label": "page_header", "id": 8, "page_no": 0, "cluster": {"id": 8, "label": "page_header", "bbox": {"l": 194.478, "t": 93.66300000000001, "r": 447.545, "b": 102.03700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9373534917831421, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.03700000000003, "r_x1": 447.545, "r_y1": 102.03700000000003, "r_x2": 447.545, "r_y2": 93.66300000000001, "r_x3": 194.478, "r_y3": 93.66300000000001, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 9, "page_no": 0, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 475.984, "t": 93.66300000000001, "r": 480.593, "b": 102.03700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.8858680725097656, "cells": [{"index": -1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.03700000000003, "r_x1": 480.593, "r_y1": 102.03700000000003, "r_x2": 480.593, "r_y2": 93.66300000000001, "r_x3": 475.984, "r_y3": 93.66300000000001, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9"}]}}]