docling/tests/data/groundtruth/docling_v1/2305.03393v1.pages.json
Christoph Auer f1f7df49e3 Update test-cases
Signed-off-by: Christoph Auer <cau@zurich.ibm.com>
2025-03-25 13:49:08 +01:00

1 line
2.8 MiB

[{"page_no": 0, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.58100000000002, "r_x1": 480.597, "r_y1": 128.58100000000002, "r_x2": 480.597, "r_y2": 115.899, "r_x3": 134.765, "r_y3": 115.899, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.675, "r_y0": 146.514, "r_x1": 348.685, "r_y1": 146.514, "r_x2": 348.685, "r_y2": 133.832, "r_x3": 266.675, "r_y3": 133.832, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.226, "r_y0": 180.471, "r_x1": 217.044, "r_y1": 180.471, "r_x2": 217.044, "r_y2": 171.67399999999998, "r_x3": 151.226, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.046, "r_y0": 176.25300000000004, "r_x1": 235.188, "r_y1": 176.25300000000004, "r_x2": 235.188, "r_y2": 170.159, "r_x3": 217.046, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.186, "r_y0": 176.154, "r_x1": 241.413, "r_y1": 176.154, "r_x2": 241.413, "r_y2": 170.159, "r_x3": 235.186, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.413, "r_y0": 176.25300000000004, "r_x1": 257.299, "r_y1": 176.25300000000004, "r_x2": 257.299, "r_y2": 170.159, "r_x3": 241.413, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.298, "r_y0": 176.154, "r_x1": 263.525, "r_y1": 176.154, "r_x2": 263.525, "r_y2": 170.159, "r_x3": 257.298, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.525, "r_y0": 176.25300000000004, "r_x1": 279.411, "r_y1": 176.25300000000004, "r_x2": 279.411, "r_y2": 170.159, "r_x3": 263.525, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.41, "r_y0": 176.154, "r_x1": 285.637, "r_y1": 176.154, "r_x2": 285.637, "r_y2": 170.159, "r_x3": 279.41, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.636, "r_y0": 176.25300000000004, "r_x1": 303.778, "r_y1": 176.25300000000004, "r_x2": 303.778, "r_y2": 170.159, "r_x3": 285.636, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "6960]", "orig": "6960]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.275, "r_y0": 180.471, "r_x1": 307.042, "r_y1": 180.471, "r_x2": 307.042, "r_y2": 171.67399999999998, "r_x3": 304.275, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 310.359, "r_y0": 180.471, "r_x1": 374.138, "r_y1": 180.471, "r_x2": 374.138, "r_y2": 171.67399999999998, "r_x3": 310.359, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar", "orig": "Ahmed Nassar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.135, "r_y0": 176.25300000000004, "r_x1": 392.277, "r_y1": 176.25300000000004, "r_x2": 392.277, "r_y2": 170.159, "r_x3": 374.135, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.275, "r_y0": 176.154, "r_x1": 398.502, "r_y1": 176.154, "r_x2": 398.502, "r_y2": 170.159, "r_x3": 392.275, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.502, "r_y0": 176.25300000000004, "r_x1": 414.388, "r_y1": 176.25300000000004, "r_x2": 414.388, "r_y2": 170.159, "r_x3": 398.502, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 414.387, "r_y0": 176.154, "r_x1": 420.614, "r_y1": 176.154, "r_x2": 420.614, "r_y2": 170.159, "r_x3": 414.387, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.613, "r_y0": 176.25300000000004, "r_x1": 436.499, "r_y1": 176.25300000000004, "r_x2": 436.499, "r_y2": 170.159, "r_x3": 420.613, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.498, "r_y0": 176.154, "r_x1": 442.725, "r_y1": 176.154, "r_x2": 442.725, "r_y2": 170.159, "r_x3": 436.498, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.725, "r_y0": 176.25300000000004, "r_x1": 460.867, "r_y1": 176.25300000000004, "r_x2": 460.867, "r_y2": 170.159, "r_x3": 442.725, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0822]", "orig": "0822]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.363, "r_y0": 180.471, "r_x1": 464.13, "r_y1": 180.471, "r_x2": 464.13, "r_y2": 171.67399999999998, "r_x3": 461.363, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.343, "r_y0": 192.42600000000004, "r_x1": 224.807, "r_y1": 192.42600000000004, "r_x2": 224.807, "r_y2": 183.62900000000002, "r_x3": 139.343, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.807, "r_y0": 188.20899999999995, "r_x1": 242.949, "r_y1": 188.20899999999995, "r_x2": 242.949, "r_y2": 182.115, "r_x3": 224.807, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.947, "r_y0": 188.11, "r_x1": 249.174, "r_y1": 188.11, "r_x2": 249.174, "r_y2": 182.115, "r_x3": 242.947, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.174, "r_y0": 188.20899999999995, "r_x1": 265.06, "r_y1": 188.20899999999995, "r_x2": 265.06, "r_y2": 182.115, "r_x3": 249.174, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.059, "r_y0": 188.11, "r_x1": 271.286, "r_y1": 188.11, "r_x2": 271.286, "r_y2": 182.115, "r_x3": 265.059, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.285, "r_y0": 188.20899999999995, "r_x1": 287.171, "r_y1": 188.20899999999995, "r_x2": 287.171, "r_y2": 182.115, "r_x3": 271.285, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.17, "r_y0": 188.11, "r_x1": 293.397, "r_y1": 188.11, "r_x2": 293.397, "r_y2": 182.115, "r_x3": 287.17, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.397, "r_y0": 188.20899999999995, "r_x1": 311.539, "r_y1": 188.20899999999995, "r_x2": 311.539, "r_y2": 182.115, "r_x3": 293.397, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "3491]", "orig": "3491]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.035, "r_y0": 192.42600000000004, "r_x1": 314.802, "r_y1": 192.42600000000004, "r_x2": 314.802, "r_y2": 183.62900000000002, "r_x3": 312.035, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.119, "r_y0": 192.42600000000004, "r_x1": 386.02, "r_y1": 192.42600000000004, "r_x2": 386.02, "r_y2": 183.62900000000002, "r_x3": 318.119, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Christoph Auer", "orig": "Christoph Auer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.018, "r_y0": 188.20899999999995, "r_x1": 404.16, "r_y1": 188.20899999999995, "r_x2": 404.16, "r_y2": 182.115, "r_x3": 386.018, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 404.158, "r_y0": 188.11, "r_x1": 410.385, "r_y1": 188.11, "r_x2": 410.385, "r_y2": 182.115, "r_x3": 404.158, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.385, "r_y0": 188.20899999999995, "r_x1": 426.271, "r_y1": 188.20899999999995, "r_x2": 426.271, "r_y2": 182.115, "r_x3": 410.385, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.27, "r_y0": 188.11, "r_x1": 432.497, "r_y1": 188.11, "r_x2": 432.497, "r_y2": 182.115, "r_x3": 426.27, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.496, "r_y0": 188.20899999999995, "r_x1": 448.382, "r_y1": 188.20899999999995, "r_x2": 448.382, "r_y2": 182.115, "r_x3": 432.496, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.381, "r_y0": 188.11, "r_x1": 454.608, "r_y1": 188.11, "r_x2": 454.608, "r_y2": 182.115, "r_x3": 448.381, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.608, "r_y0": 188.20899999999995, "r_x1": 472.75, "r_y1": 188.20899999999995, "r_x2": 472.75, "r_y2": 182.115, "r_x3": 454.608, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0422]", "orig": "0422]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.246, "r_y0": 192.42600000000004, "r_x1": 476.013, "r_y1": 192.42600000000004, "r_x2": 476.013, "r_y2": 183.62900000000002, "r_x3": 473.246, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.521, "r_y0": 204.38099999999997, "r_x1": 298.609, "r_y1": 204.38099999999997, "r_x2": 298.609, "r_y2": 195.58399999999995, "r_x3": 229.521, "r_y3": 195.58399999999995, "coord_origin": "TOPLEFT"}, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.606, "r_y0": 200.164, "r_x1": 316.748, "r_y1": 200.164, "r_x2": 316.748, "r_y2": 194.07000000000005, "r_x3": 298.606, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.746, "r_y0": 200.06500000000005, "r_x1": 322.973, "r_y1": 200.06500000000005, "r_x2": 322.973, "r_y2": 194.07000000000005, "r_x3": 316.746, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.973, "r_y0": 200.164, "r_x1": 338.859, "r_y1": 200.164, "r_x2": 338.859, "r_y2": 194.07000000000005, "r_x3": 322.973, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.858, "r_y0": 200.06500000000005, "r_x1": 345.085, "r_y1": 200.06500000000005, "r_x2": 345.085, "r_y2": 194.07000000000005, "r_x3": 338.858, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.085, "r_y0": 200.164, "r_x1": 360.971, "r_y1": 200.164, "r_x2": 360.971, "r_y2": 194.07000000000005, "r_x3": 345.085, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.97, "r_y0": 200.06500000000005, "r_x1": 367.197, "r_y1": 200.06500000000005, "r_x2": 367.197, "r_y2": 194.07000000000005, "r_x3": 360.97, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.196, "r_y0": 200.164, "r_x1": 385.338, "r_y1": 200.164, "r_x2": 385.338, "r_y2": 194.07000000000005, "r_x3": 367.196, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.105, "r_y0": 226.21500000000003, "r_x1": 336.251, "r_y1": 226.21500000000003, "r_x2": 336.251, "r_y2": 214.92600000000004, "r_x3": 279.105, "r_y3": 214.92600000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.966, "r_y0": 236.27800000000002, "r_x1": 392.39, "r_y1": 236.27800000000002, "r_x2": 392.39, "r_y2": 228.80899999999997, "r_x3": 222.966, "r_y3": 228.80899999999997, "coord_origin": "TOPLEFT"}, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 278.227, "r_x1": 206.636, "r_y1": 278.227, "r_x2": 206.636, "r_y2": 270.30100000000004, "r_x3": 163.111, "r_y3": 270.30100000000004, "coord_origin": "TOPLEFT"}, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.617, "r_y0": 279.375, "r_x1": 452.245, "r_y1": 279.375, "r_x2": 452.245, "r_y2": 268.086, "r_x3": 211.617, "r_y3": 268.086, "coord_origin": "TOPLEFT"}, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 290.334, "r_x1": 452.242, "r_y1": 290.334, "r_x2": 452.242, "r_y2": 279.04499999999996, "r_x3": 163.111, "r_y3": 279.04499999999996, "coord_origin": "TOPLEFT"}, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 301.293, "r_x1": 452.248, "r_y1": 301.293, "r_x2": 452.248, "r_y2": 290.004, "r_x3": 163.111, "r_y3": 290.004, "coord_origin": "TOPLEFT"}, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 312.252, "r_x1": 452.241, "r_y1": 312.252, "r_x2": 452.241, "r_y2": 300.963, "r_x3": 163.111, "r_y3": 300.963, "coord_origin": "TOPLEFT"}, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 323.21, "r_x1": 452.246, "r_y1": 323.21, "r_x2": 452.246, "r_y2": 311.921, "r_x3": 163.111, "r_y3": 311.921, "coord_origin": "TOPLEFT"}, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 334.169, "r_x1": 452.246, "r_y1": 334.169, "r_x2": 452.246, "r_y2": 322.88, "r_x3": 163.111, "r_y3": 322.88, "coord_origin": "TOPLEFT"}, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 345.128, "r_x1": 452.247, "r_y1": 345.128, "r_x2": 452.247, "r_y2": 333.839, "r_x3": 163.111, "r_y3": 333.839, "coord_origin": "TOPLEFT"}, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 356.087, "r_x1": 452.246, "r_y1": 356.087, "r_x2": 452.246, "r_y2": 344.798, "r_x3": 163.111, "r_y3": 344.798, "coord_origin": "TOPLEFT"}, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 367.046, "r_x1": 452.248, "r_y1": 367.046, "r_x2": 452.248, "r_y2": 355.757, "r_x3": 163.111, "r_y3": 355.757, "coord_origin": "TOPLEFT"}, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 378.005, "r_x1": 452.246, "r_y1": 378.005, "r_x2": 452.246, "r_y2": 366.716, "r_x3": 163.111, "r_y3": 366.716, "coord_origin": "TOPLEFT"}, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 388.964, "r_x1": 452.242, "r_y1": 388.964, "r_x2": 452.242, "r_y2": 377.675, "r_x3": 163.111, "r_y3": 377.675, "coord_origin": "TOPLEFT"}, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 399.923, "r_x1": 169.253, "r_y1": 399.923, "r_x2": 169.253, "r_y2": 388.634, "r_x3": 163.111, "r_y3": 388.634, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.795, "r_y0": 399.923, "r_x1": 452.244, "r_y1": 399.923, "r_x2": 452.244, "r_y2": 388.634, "r_x3": 172.795, "r_y3": 388.634, "coord_origin": "TOPLEFT"}, "text": "reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 410.882, "r_x1": 452.249, "r_y1": 410.882, "r_x2": 452.249, "r_y2": 399.593, "r_x3": 163.111, "r_y3": 399.593, "coord_origin": "TOPLEFT"}, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 421.841, "r_x1": 198.194, "r_y1": 421.841, "r_x2": 198.194, "r_y2": 410.552, "r_x3": 163.111, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "accuracy", "orig": "accuracy", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.632, "r_y0": 421.841, "r_x1": 292.676, "r_y1": 421.841, "r_x2": 292.676, "r_y2": 410.552, "r_x3": 202.632, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "improves significantly,", "orig": "improves significantly,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.115, "r_y0": 421.841, "r_x1": 332.719, "r_y1": 421.841, "r_x2": 332.719, "r_y2": 410.552, "r_x3": 297.115, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "inference", "orig": "inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.158, "r_y0": 421.841, "r_x1": 365.708, "r_y1": 421.841, "r_x2": 365.708, "r_y2": 410.552, "r_x3": 337.158, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "time is", "orig": "time is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.146, "r_y0": 421.841, "r_x1": 396.249, "r_y1": 421.841, "r_x2": 396.249, "r_y2": 410.552, "r_x3": 370.146, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "halved", "orig": "halved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.696, "r_y0": 421.841, "r_x1": 452.241, "r_y1": 421.841, "r_x2": 452.241, "r_y2": 410.552, "r_x3": 400.696, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "compared to", "orig": "compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 432.799, "r_x1": 452.242, "r_y1": 432.799, "r_x2": 452.242, "r_y2": 421.51, "r_x3": 163.111, "r_y3": 421.51, "coord_origin": "TOPLEFT"}, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 443.758, "r_x1": 200.22, "r_y1": 443.758, "r_x2": 200.22, "r_y2": 432.469, "r_x3": 163.111, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "tactically", "orig": "tactically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 204.282, "r_y0": 443.758, "r_x1": 234.527, "r_y1": 443.758, "r_x2": 234.527, "r_y2": 432.469, "r_x3": 204.282, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "correct.", "orig": "correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 238.588, "r_y0": 443.758, "r_x1": 452.244, "r_y1": 443.758, "r_x2": 452.244, "r_y2": 432.469, "r_x3": 238.588, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "This in turn eliminates most post-processing needs.", "orig": "This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 454.717, "r_x1": 452.246, "r_y1": 454.717, "r_x2": 452.246, "r_y2": 443.428, "r_x3": 163.111, "r_y3": 443.428, "coord_origin": "TOPLEFT"}, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 465.676, "r_x1": 225.561, "r_y1": 465.676, "r_x2": 225.561, "r_y2": 454.387, "r_x3": 163.111, "r_y3": 454.387, "coord_origin": "TOPLEFT"}, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 486.62, "r_x1": 211.942, "r_y1": 486.62, "r_x2": 211.942, "r_y2": 478.694, "r_x3": 163.111, "r_y3": 478.694, "coord_origin": "TOPLEFT"}, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.552, "r_y0": 487.768, "r_x1": 452.241, "r_y1": 487.768, "r_x2": 452.241, "r_y2": 476.479, "r_x3": 216.552, "r_y3": 476.479, "coord_origin": "TOPLEFT"}, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 498.727, "r_x1": 257.642, "r_y1": 498.727, "r_x2": 257.642, "r_y2": 487.438, "r_x3": 163.111, "r_y3": 487.438, "coord_origin": "TOPLEFT"}, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 532.688, "r_x1": 141.489, "r_y1": 532.688, "r_x2": 141.489, "r_y2": 522.12, "r_x3": 134.765, "r_y3": 522.12, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 532.688, "r_x1": 228.934, "r_y1": 532.688, "r_x2": 228.934, "r_y2": 522.12, "r_x3": 154.938, "r_y3": 522.12, "coord_origin": "TOPLEFT"}, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.0840000000001, "r_x1": 480.594, "r_y1": 557.0840000000001, "r_x2": 480.594, "r_y2": 548.287, "r_x3": 134.765, "r_y3": 548.287, "coord_origin": "TOPLEFT"}, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.04, "r_x1": 480.592, "r_y1": 569.04, "r_x2": 480.592, "r_y2": 560.2429999999999, "r_x3": 134.765, "r_y3": 560.2429999999999, "coord_origin": "TOPLEFT"}, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 580.995, "r_x1": 170.451, "r_y1": 580.995, "r_x2": 170.451, "r_y2": 572.198, "r_x3": 134.765, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "valuable", "orig": "valuable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.173, "r_y0": 580.995, "r_x1": 225.832, "r_y1": 580.995, "r_x2": 225.832, "r_y2": 572.198, "r_x3": 175.173, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "information", "orig": "information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.544, "r_y0": 580.995, "r_x1": 289.826, "r_y1": 580.995, "r_x2": 289.826, "r_y2": 572.198, "r_x3": 230.544, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "and therefore", "orig": "and therefore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 294.538, "r_y0": 580.995, "r_x1": 388.395, "r_y1": 580.995, "r_x2": 388.395, "r_y2": 572.198, "r_x3": 294.538, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "need to be extracted", "orig": "need to be extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.107, "r_y0": 580.995, "r_x1": 480.593, "r_y1": 580.995, "r_x2": 480.593, "r_y2": 572.198, "r_x3": 393.107, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "with high accuracy.", "orig": "with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 592.95, "r_x1": 480.596, "r_y1": 592.95, "r_x2": 480.596, "r_y2": 584.153, "r_x3": 134.765, "r_y3": 584.153, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 604.905, "r_x1": 155.266, "r_y1": 604.905, "r_x2": 155.266, "r_y2": 596.108, "r_x3": 134.765, "r_y3": 596.108, "coord_origin": "TOPLEFT"}, "text": "ture,", "orig": "ture,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.48, "r_y0": 604.905, "r_x1": 480.587, "r_y1": 604.905, "r_x2": 480.587, "r_y2": 596.108, "r_x3": 159.48, "r_y3": 596.108, "coord_origin": "TOPLEFT"}, "text": "making it difficult to recover their correct structure with simple analyt-", "orig": "making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 616.86, "r_x1": 149.705, "r_y1": 616.86, "r_x2": 149.705, "r_y2": 608.063, "r_x3": 134.765, "r_y3": 608.063, "coord_origin": "TOPLEFT"}, "text": "ical", "orig": "ical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.71, "r_y0": 616.86, "r_x1": 480.591, "r_y1": 616.86, "r_x2": 480.591, "r_y2": 608.063, "r_x3": 153.71, "r_y3": 608.063, "coord_origin": "TOPLEFT"}, "text": "methods. Therefore, accurate table extraction is achieved these days with", "orig": "methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.815, "r_x1": 279.327, "r_y1": 628.815, "r_x2": 279.327, "r_y2": 620.018, "r_x3": 134.765, "r_y3": 620.018, "coord_origin": "TOPLEFT"}, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.708, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 149.708, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.596, "r_y1": 652.9, "r_x2": 480.596, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 480.595, "r_y1": 664.855, "r_x2": 480.595, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 555.0, "r_x1": 36.34, "r_y1": 375.0, "r_x2": 18.34, "r_y2": 375.0, "r_x3": 18.34, "r_y3": 555.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2305.03393v1", "orig": "arXiv:2305.03393v1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 355.0, "r_x1": 36.34, "r_y1": 285.0, "r_x2": 18.34, "r_y2": 285.0, "r_x3": 18.34, "r_y3": 355.0, "coord_origin": "TOPLEFT"}, "text": "[cs.CV]", "orig": "[cs.CV]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 265.0, "r_x1": 36.34, "r_y1": 255.0, "r_x2": 18.34, "r_y2": 255.0, "r_x3": 18.34, "r_y3": 265.0, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 245.0, "r_x1": 36.34, "r_y1": 215.0, "r_x2": 18.34, "r_y2": 215.0, "r_x3": 18.34, "r_y3": 245.0, "coord_origin": "TOPLEFT"}, "text": "May", "orig": "May", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 205.0, "r_x1": 36.34, "r_y1": 165.0, "r_x2": 18.34, "r_y2": 165.0, "r_x3": 18.34, "r_y3": 205.0, "coord_origin": "TOPLEFT"}, "text": "2023", "orig": "2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 5, "label": "section_header", "bbox": {"l": 134.765, "t": 115.899, "r": 480.597, "b": 146.514, "coord_origin": "TOPLEFT"}, "confidence": 0.8918349742889404, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.58100000000002, "r_x1": 480.597, "r_y1": 128.58100000000002, "r_x2": 480.597, "r_y2": 115.899, "r_x3": 134.765, "r_y3": 115.899, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.675, "r_y0": 146.514, "r_x1": 348.685, "r_y1": 146.514, "r_x2": 348.685, "r_y2": 133.832, "r_x3": 266.675, "r_y3": 133.832, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "key_value_region", "bbox": {"l": 139.343, "t": 170.159, "r": 476.013, "b": 236.27800000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.48445820808410645, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.226, "r_y0": 180.471, "r_x1": 217.044, "r_y1": 180.471, "r_x2": 217.044, "r_y2": 171.67399999999998, "r_x3": 151.226, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.046, "r_y0": 176.25300000000004, "r_x1": 235.188, "r_y1": 176.25300000000004, "r_x2": 235.188, "r_y2": 170.159, "r_x3": 217.046, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.186, "r_y0": 176.154, "r_x1": 241.413, "r_y1": 176.154, "r_x2": 241.413, "r_y2": 170.159, "r_x3": 235.186, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.413, "r_y0": 176.25300000000004, "r_x1": 257.299, "r_y1": 176.25300000000004, "r_x2": 257.299, "r_y2": 170.159, "r_x3": 241.413, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.298, "r_y0": 176.154, "r_x1": 263.525, "r_y1": 176.154, "r_x2": 263.525, "r_y2": 170.159, "r_x3": 257.298, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.525, "r_y0": 176.25300000000004, "r_x1": 279.411, "r_y1": 176.25300000000004, "r_x2": 279.411, "r_y2": 170.159, "r_x3": 263.525, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.41, "r_y0": 176.154, "r_x1": 285.637, "r_y1": 176.154, "r_x2": 285.637, "r_y2": 170.159, "r_x3": 279.41, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.636, "r_y0": 176.25300000000004, "r_x1": 303.778, "r_y1": 176.25300000000004, "r_x2": 303.778, "r_y2": 170.159, "r_x3": 285.636, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "6960]", "orig": "6960]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.275, "r_y0": 180.471, "r_x1": 307.042, "r_y1": 180.471, "r_x2": 307.042, "r_y2": 171.67399999999998, "r_x3": 304.275, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 310.359, "r_y0": 180.471, "r_x1": 374.138, "r_y1": 180.471, "r_x2": 374.138, "r_y2": 171.67399999999998, "r_x3": 310.359, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar", "orig": "Ahmed Nassar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.135, "r_y0": 176.25300000000004, "r_x1": 392.277, "r_y1": 176.25300000000004, "r_x2": 392.277, "r_y2": 170.159, "r_x3": 374.135, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.275, "r_y0": 176.154, "r_x1": 398.502, "r_y1": 176.154, "r_x2": 398.502, "r_y2": 170.159, "r_x3": 392.275, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.502, "r_y0": 176.25300000000004, "r_x1": 414.388, "r_y1": 176.25300000000004, "r_x2": 414.388, "r_y2": 170.159, "r_x3": 398.502, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 414.387, "r_y0": 176.154, "r_x1": 420.614, "r_y1": 176.154, "r_x2": 420.614, "r_y2": 170.159, "r_x3": 414.387, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.613, "r_y0": 176.25300000000004, "r_x1": 436.499, "r_y1": 176.25300000000004, "r_x2": 436.499, "r_y2": 170.159, "r_x3": 420.613, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.498, "r_y0": 176.154, "r_x1": 442.725, "r_y1": 176.154, "r_x2": 442.725, "r_y2": 170.159, "r_x3": 436.498, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.725, "r_y0": 176.25300000000004, "r_x1": 460.867, "r_y1": 176.25300000000004, "r_x2": 460.867, "r_y2": 170.159, "r_x3": 442.725, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0822]", "orig": "0822]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.363, "r_y0": 180.471, "r_x1": 464.13, "r_y1": 180.471, "r_x2": 464.13, "r_y2": 171.67399999999998, "r_x3": 461.363, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.343, "r_y0": 192.42600000000004, "r_x1": 224.807, "r_y1": 192.42600000000004, "r_x2": 224.807, "r_y2": 183.62900000000002, "r_x3": 139.343, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.807, "r_y0": 188.20899999999995, "r_x1": 242.949, "r_y1": 188.20899999999995, "r_x2": 242.949, "r_y2": 182.115, "r_x3": 224.807, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.947, "r_y0": 188.11, "r_x1": 249.174, "r_y1": 188.11, "r_x2": 249.174, "r_y2": 182.115, "r_x3": 242.947, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.174, "r_y0": 188.20899999999995, "r_x1": 265.06, "r_y1": 188.20899999999995, "r_x2": 265.06, "r_y2": 182.115, "r_x3": 249.174, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.059, "r_y0": 188.11, "r_x1": 271.286, "r_y1": 188.11, "r_x2": 271.286, "r_y2": 182.115, "r_x3": 265.059, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.285, "r_y0": 188.20899999999995, "r_x1": 287.171, "r_y1": 188.20899999999995, "r_x2": 287.171, "r_y2": 182.115, "r_x3": 271.285, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.17, "r_y0": 188.11, "r_x1": 293.397, "r_y1": 188.11, "r_x2": 293.397, "r_y2": 182.115, "r_x3": 287.17, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.397, "r_y0": 188.20899999999995, "r_x1": 311.539, "r_y1": 188.20899999999995, "r_x2": 311.539, "r_y2": 182.115, "r_x3": 293.397, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "3491]", "orig": "3491]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.035, "r_y0": 192.42600000000004, "r_x1": 314.802, "r_y1": 192.42600000000004, "r_x2": 314.802, "r_y2": 183.62900000000002, "r_x3": 312.035, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.119, "r_y0": 192.42600000000004, "r_x1": 386.02, "r_y1": 192.42600000000004, "r_x2": 386.02, "r_y2": 183.62900000000002, "r_x3": 318.119, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Christoph Auer", "orig": "Christoph Auer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.018, "r_y0": 188.20899999999995, "r_x1": 404.16, "r_y1": 188.20899999999995, "r_x2": 404.16, "r_y2": 182.115, "r_x3": 386.018, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 404.158, "r_y0": 188.11, "r_x1": 410.385, "r_y1": 188.11, "r_x2": 410.385, "r_y2": 182.115, "r_x3": 404.158, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.385, "r_y0": 188.20899999999995, "r_x1": 426.271, "r_y1": 188.20899999999995, "r_x2": 426.271, "r_y2": 182.115, "r_x3": 410.385, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.27, "r_y0": 188.11, "r_x1": 432.497, "r_y1": 188.11, "r_x2": 432.497, "r_y2": 182.115, "r_x3": 426.27, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.496, "r_y0": 188.20899999999995, "r_x1": 448.382, "r_y1": 188.20899999999995, "r_x2": 448.382, "r_y2": 182.115, "r_x3": 432.496, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.381, "r_y0": 188.11, "r_x1": 454.608, "r_y1": 188.11, "r_x2": 454.608, "r_y2": 182.115, "r_x3": 448.381, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.608, "r_y0": 188.20899999999995, "r_x1": 472.75, "r_y1": 188.20899999999995, "r_x2": 472.75, "r_y2": 182.115, "r_x3": 454.608, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0422]", "orig": "0422]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.246, "r_y0": 192.42600000000004, "r_x1": 476.013, "r_y1": 192.42600000000004, "r_x2": 476.013, "r_y2": 183.62900000000002, "r_x3": 473.246, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.521, "r_y0": 204.38099999999997, "r_x1": 298.609, "r_y1": 204.38099999999997, "r_x2": 298.609, "r_y2": 195.58399999999995, "r_x3": 229.521, "r_y3": 195.58399999999995, "coord_origin": "TOPLEFT"}, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.606, "r_y0": 200.164, "r_x1": 316.748, "r_y1": 200.164, "r_x2": 316.748, "r_y2": 194.07000000000005, "r_x3": 298.606, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.746, "r_y0": 200.06500000000005, "r_x1": 322.973, "r_y1": 200.06500000000005, "r_x2": 322.973, "r_y2": 194.07000000000005, "r_x3": 316.746, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.973, "r_y0": 200.164, "r_x1": 338.859, "r_y1": 200.164, "r_x2": 338.859, "r_y2": 194.07000000000005, "r_x3": 322.973, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.858, "r_y0": 200.06500000000005, "r_x1": 345.085, "r_y1": 200.06500000000005, "r_x2": 345.085, "r_y2": 194.07000000000005, "r_x3": 338.858, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.085, "r_y0": 200.164, "r_x1": 360.971, "r_y1": 200.164, "r_x2": 360.971, "r_y2": 194.07000000000005, "r_x3": 345.085, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.97, "r_y0": 200.06500000000005, "r_x1": 367.197, "r_y1": 200.06500000000005, "r_x2": 367.197, "r_y2": 194.07000000000005, "r_x3": 360.97, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.196, "r_y0": 200.164, "r_x1": 385.338, "r_y1": 200.164, "r_x2": 385.338, "r_y2": 194.07000000000005, "r_x3": 367.196, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.105, "r_y0": 226.21500000000003, "r_x1": 336.251, "r_y1": 226.21500000000003, "r_x2": 336.251, "r_y2": 214.92600000000004, "r_x3": 279.105, "r_y3": 214.92600000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.966, "r_y0": 236.27800000000002, "r_x1": 392.39, "r_y1": 236.27800000000002, "r_x2": 392.39, "r_y2": 228.80899999999997, "r_x3": 222.966, "r_y3": 228.80899999999997, "coord_origin": "TOPLEFT"}, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 7, "label": "text", "bbox": {"l": 139.343, "t": 170.159, "r": 476.013, "b": 200.164, "coord_origin": "TOPLEFT"}, "confidence": 0.7918068766593933, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.226, "r_y0": 180.471, "r_x1": 217.044, "r_y1": 180.471, "r_x2": 217.044, "r_y2": 171.67399999999998, "r_x3": 151.226, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.046, "r_y0": 176.25300000000004, "r_x1": 235.188, "r_y1": 176.25300000000004, "r_x2": 235.188, "r_y2": 170.159, "r_x3": 217.046, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.186, "r_y0": 176.154, "r_x1": 241.413, "r_y1": 176.154, "r_x2": 241.413, "r_y2": 170.159, "r_x3": 235.186, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.413, "r_y0": 176.25300000000004, "r_x1": 257.299, "r_y1": 176.25300000000004, "r_x2": 257.299, "r_y2": 170.159, "r_x3": 241.413, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.298, "r_y0": 176.154, "r_x1": 263.525, "r_y1": 176.154, "r_x2": 263.525, "r_y2": 170.159, "r_x3": 257.298, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.525, "r_y0": 176.25300000000004, "r_x1": 279.411, "r_y1": 176.25300000000004, "r_x2": 279.411, "r_y2": 170.159, "r_x3": 263.525, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.41, "r_y0": 176.154, "r_x1": 285.637, "r_y1": 176.154, "r_x2": 285.637, "r_y2": 170.159, "r_x3": 279.41, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.636, "r_y0": 176.25300000000004, "r_x1": 303.778, "r_y1": 176.25300000000004, "r_x2": 303.778, "r_y2": 170.159, "r_x3": 285.636, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "6960]", "orig": "6960]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.275, "r_y0": 180.471, "r_x1": 307.042, "r_y1": 180.471, "r_x2": 307.042, "r_y2": 171.67399999999998, "r_x3": 304.275, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 310.359, "r_y0": 180.471, "r_x1": 374.138, "r_y1": 180.471, "r_x2": 374.138, "r_y2": 171.67399999999998, "r_x3": 310.359, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar", "orig": "Ahmed Nassar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.135, "r_y0": 176.25300000000004, "r_x1": 392.277, "r_y1": 176.25300000000004, "r_x2": 392.277, "r_y2": 170.159, "r_x3": 374.135, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.275, "r_y0": 176.154, "r_x1": 398.502, "r_y1": 176.154, "r_x2": 398.502, "r_y2": 170.159, "r_x3": 392.275, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.502, "r_y0": 176.25300000000004, "r_x1": 414.388, "r_y1": 176.25300000000004, "r_x2": 414.388, "r_y2": 170.159, "r_x3": 398.502, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 414.387, "r_y0": 176.154, "r_x1": 420.614, "r_y1": 176.154, "r_x2": 420.614, "r_y2": 170.159, "r_x3": 414.387, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.613, "r_y0": 176.25300000000004, "r_x1": 436.499, "r_y1": 176.25300000000004, "r_x2": 436.499, "r_y2": 170.159, "r_x3": 420.613, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.498, "r_y0": 176.154, "r_x1": 442.725, "r_y1": 176.154, "r_x2": 442.725, "r_y2": 170.159, "r_x3": 436.498, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.725, "r_y0": 176.25300000000004, "r_x1": 460.867, "r_y1": 176.25300000000004, "r_x2": 460.867, "r_y2": 170.159, "r_x3": 442.725, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0822]", "orig": "0822]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.363, "r_y0": 180.471, "r_x1": 464.13, "r_y1": 180.471, "r_x2": 464.13, "r_y2": 171.67399999999998, "r_x3": 461.363, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.343, "r_y0": 192.42600000000004, "r_x1": 224.807, "r_y1": 192.42600000000004, "r_x2": 224.807, "r_y2": 183.62900000000002, "r_x3": 139.343, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.807, "r_y0": 188.20899999999995, "r_x1": 242.949, "r_y1": 188.20899999999995, "r_x2": 242.949, "r_y2": 182.115, "r_x3": 224.807, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.947, "r_y0": 188.11, "r_x1": 249.174, "r_y1": 188.11, "r_x2": 249.174, "r_y2": 182.115, "r_x3": 242.947, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.174, "r_y0": 188.20899999999995, "r_x1": 265.06, "r_y1": 188.20899999999995, "r_x2": 265.06, "r_y2": 182.115, "r_x3": 249.174, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.059, "r_y0": 188.11, "r_x1": 271.286, "r_y1": 188.11, "r_x2": 271.286, "r_y2": 182.115, "r_x3": 265.059, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.285, "r_y0": 188.20899999999995, "r_x1": 287.171, "r_y1": 188.20899999999995, "r_x2": 287.171, "r_y2": 182.115, "r_x3": 271.285, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.17, "r_y0": 188.11, "r_x1": 293.397, "r_y1": 188.11, "r_x2": 293.397, "r_y2": 182.115, "r_x3": 287.17, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.397, "r_y0": 188.20899999999995, "r_x1": 311.539, "r_y1": 188.20899999999995, "r_x2": 311.539, "r_y2": 182.115, "r_x3": 293.397, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "3491]", "orig": "3491]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.035, "r_y0": 192.42600000000004, "r_x1": 314.802, "r_y1": 192.42600000000004, "r_x2": 314.802, "r_y2": 183.62900000000002, "r_x3": 312.035, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.119, "r_y0": 192.42600000000004, "r_x1": 386.02, "r_y1": 192.42600000000004, "r_x2": 386.02, "r_y2": 183.62900000000002, "r_x3": 318.119, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Christoph Auer", "orig": "Christoph Auer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.018, "r_y0": 188.20899999999995, "r_x1": 404.16, "r_y1": 188.20899999999995, "r_x2": 404.16, "r_y2": 182.115, "r_x3": 386.018, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 404.158, "r_y0": 188.11, "r_x1": 410.385, "r_y1": 188.11, "r_x2": 410.385, "r_y2": 182.115, "r_x3": 404.158, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.385, "r_y0": 188.20899999999995, "r_x1": 426.271, "r_y1": 188.20899999999995, "r_x2": 426.271, "r_y2": 182.115, "r_x3": 410.385, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.27, "r_y0": 188.11, "r_x1": 432.497, "r_y1": 188.11, "r_x2": 432.497, "r_y2": 182.115, "r_x3": 426.27, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.496, "r_y0": 188.20899999999995, "r_x1": 448.382, "r_y1": 188.20899999999995, "r_x2": 448.382, "r_y2": 182.115, "r_x3": 432.496, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.381, "r_y0": 188.11, "r_x1": 454.608, "r_y1": 188.11, "r_x2": 454.608, "r_y2": 182.115, "r_x3": 448.381, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.608, "r_y0": 188.20899999999995, "r_x1": 472.75, "r_y1": 188.20899999999995, "r_x2": 472.75, "r_y2": 182.115, "r_x3": 454.608, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0422]", "orig": "0422]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.246, "r_y0": 192.42600000000004, "r_x1": 476.013, "r_y1": 192.42600000000004, "r_x2": 476.013, "r_y2": 183.62900000000002, "r_x3": 473.246, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.606, "r_y0": 200.164, "r_x1": 316.748, "r_y1": 200.164, "r_x2": 316.748, "r_y2": 194.07000000000005, "r_x3": 298.606, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.746, "r_y0": 200.06500000000005, "r_x1": 322.973, "r_y1": 200.06500000000005, "r_x2": 322.973, "r_y2": 194.07000000000005, "r_x3": 316.746, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.973, "r_y0": 200.164, "r_x1": 338.859, "r_y1": 200.164, "r_x2": 338.859, "r_y2": 194.07000000000005, "r_x3": 322.973, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.858, "r_y0": 200.06500000000005, "r_x1": 345.085, "r_y1": 200.06500000000005, "r_x2": 345.085, "r_y2": 194.07000000000005, "r_x3": 338.858, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.085, "r_y0": 200.164, "r_x1": 360.971, "r_y1": 200.164, "r_x2": 360.971, "r_y2": 194.07000000000005, "r_x3": 345.085, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.97, "r_y0": 200.06500000000005, "r_x1": 367.197, "r_y1": 200.06500000000005, "r_x2": 367.197, "r_y2": 194.07000000000005, "r_x3": 360.97, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.196, "r_y0": 200.164, "r_x1": 385.338, "r_y1": 200.164, "r_x2": 385.338, "r_y2": 194.07000000000005, "r_x3": 367.196, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 229.521, "t": 195.58399999999995, "r": 298.609, "b": 204.38099999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.5015263557434082, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.521, "r_y0": 204.38099999999997, "r_x1": 298.609, "r_y1": 204.38099999999997, "r_x2": 298.609, "r_y2": 195.58399999999995, "r_x3": 229.521, "r_y3": 195.58399999999995, "coord_origin": "TOPLEFT"}, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "text", "bbox": {"l": 279.105, "t": 214.92600000000004, "r": 336.251, "b": 226.21500000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.6310867667198181, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.105, "r_y0": 226.21500000000003, "r_x1": 336.251, "r_y1": 226.21500000000003, "r_x2": 336.251, "r_y2": 214.92600000000004, "r_x3": 279.105, "r_y3": 214.92600000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "text", "bbox": {"l": 222.966, "t": 228.80899999999997, "r": 392.39, "b": 236.27800000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.6924149990081787, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.966, "r_y0": 236.27800000000002, "r_x1": 392.39, "r_y1": 236.27800000000002, "r_x2": 392.39, "r_y2": 228.80899999999997, "r_x3": 222.966, "r_y3": 228.80899999999997, "coord_origin": "TOPLEFT"}, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 1, "label": "text", "bbox": {"l": 163.111, "t": 268.086, "r": 452.249, "b": 465.676, "coord_origin": "TOPLEFT"}, "confidence": 0.9807654023170471, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 278.227, "r_x1": 206.636, "r_y1": 278.227, "r_x2": 206.636, "r_y2": 270.30100000000004, "r_x3": 163.111, "r_y3": 270.30100000000004, "coord_origin": "TOPLEFT"}, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.617, "r_y0": 279.375, "r_x1": 452.245, "r_y1": 279.375, "r_x2": 452.245, "r_y2": 268.086, "r_x3": 211.617, "r_y3": 268.086, "coord_origin": "TOPLEFT"}, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 290.334, "r_x1": 452.242, "r_y1": 290.334, "r_x2": 452.242, "r_y2": 279.04499999999996, "r_x3": 163.111, "r_y3": 279.04499999999996, "coord_origin": "TOPLEFT"}, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 301.293, "r_x1": 452.248, "r_y1": 301.293, "r_x2": 452.248, "r_y2": 290.004, "r_x3": 163.111, "r_y3": 290.004, "coord_origin": "TOPLEFT"}, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 312.252, "r_x1": 452.241, "r_y1": 312.252, "r_x2": 452.241, "r_y2": 300.963, "r_x3": 163.111, "r_y3": 300.963, "coord_origin": "TOPLEFT"}, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 323.21, "r_x1": 452.246, "r_y1": 323.21, "r_x2": 452.246, "r_y2": 311.921, "r_x3": 163.111, "r_y3": 311.921, "coord_origin": "TOPLEFT"}, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 334.169, "r_x1": 452.246, "r_y1": 334.169, "r_x2": 452.246, "r_y2": 322.88, "r_x3": 163.111, "r_y3": 322.88, "coord_origin": "TOPLEFT"}, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 345.128, "r_x1": 452.247, "r_y1": 345.128, "r_x2": 452.247, "r_y2": 333.839, "r_x3": 163.111, "r_y3": 333.839, "coord_origin": "TOPLEFT"}, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 356.087, "r_x1": 452.246, "r_y1": 356.087, "r_x2": 452.246, "r_y2": 344.798, "r_x3": 163.111, "r_y3": 344.798, "coord_origin": "TOPLEFT"}, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 367.046, "r_x1": 452.248, "r_y1": 367.046, "r_x2": 452.248, "r_y2": 355.757, "r_x3": 163.111, "r_y3": 355.757, "coord_origin": "TOPLEFT"}, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 378.005, "r_x1": 452.246, "r_y1": 378.005, "r_x2": 452.246, "r_y2": 366.716, "r_x3": 163.111, "r_y3": 366.716, "coord_origin": "TOPLEFT"}, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 388.964, "r_x1": 452.242, "r_y1": 388.964, "r_x2": 452.242, "r_y2": 377.675, "r_x3": 163.111, "r_y3": 377.675, "coord_origin": "TOPLEFT"}, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 399.923, "r_x1": 169.253, "r_y1": 399.923, "r_x2": 169.253, "r_y2": 388.634, "r_x3": 163.111, "r_y3": 388.634, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.795, "r_y0": 399.923, "r_x1": 452.244, "r_y1": 399.923, "r_x2": 452.244, "r_y2": 388.634, "r_x3": 172.795, "r_y3": 388.634, "coord_origin": "TOPLEFT"}, "text": "reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 410.882, "r_x1": 452.249, "r_y1": 410.882, "r_x2": 452.249, "r_y2": 399.593, "r_x3": 163.111, "r_y3": 399.593, "coord_origin": "TOPLEFT"}, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 421.841, "r_x1": 198.194, "r_y1": 421.841, "r_x2": 198.194, "r_y2": 410.552, "r_x3": 163.111, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "accuracy", "orig": "accuracy", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.632, "r_y0": 421.841, "r_x1": 292.676, "r_y1": 421.841, "r_x2": 292.676, "r_y2": 410.552, "r_x3": 202.632, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "improves significantly,", "orig": "improves significantly,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.115, "r_y0": 421.841, "r_x1": 332.719, "r_y1": 421.841, "r_x2": 332.719, "r_y2": 410.552, "r_x3": 297.115, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "inference", "orig": "inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.158, "r_y0": 421.841, "r_x1": 365.708, "r_y1": 421.841, "r_x2": 365.708, "r_y2": 410.552, "r_x3": 337.158, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "time is", "orig": "time is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.146, "r_y0": 421.841, "r_x1": 396.249, "r_y1": 421.841, "r_x2": 396.249, "r_y2": 410.552, "r_x3": 370.146, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "halved", "orig": "halved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.696, "r_y0": 421.841, "r_x1": 452.241, "r_y1": 421.841, "r_x2": 452.241, "r_y2": 410.552, "r_x3": 400.696, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "compared to", "orig": "compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 432.799, "r_x1": 452.242, "r_y1": 432.799, "r_x2": 452.242, "r_y2": 421.51, "r_x3": 163.111, "r_y3": 421.51, "coord_origin": "TOPLEFT"}, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 443.758, "r_x1": 200.22, "r_y1": 443.758, "r_x2": 200.22, "r_y2": 432.469, "r_x3": 163.111, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "tactically", "orig": "tactically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 204.282, "r_y0": 443.758, "r_x1": 234.527, "r_y1": 443.758, "r_x2": 234.527, "r_y2": 432.469, "r_x3": 204.282, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "correct.", "orig": "correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 238.588, "r_y0": 443.758, "r_x1": 452.244, "r_y1": 443.758, "r_x2": 452.244, "r_y2": 432.469, "r_x3": 238.588, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "This in turn eliminates most post-processing needs.", "orig": "This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 454.717, "r_x1": 452.246, "r_y1": 454.717, "r_x2": 452.246, "r_y2": 443.428, "r_x3": 163.111, "r_y3": 443.428, "coord_origin": "TOPLEFT"}, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 465.676, "r_x1": 225.561, "r_y1": 465.676, "r_x2": 225.561, "r_y2": 454.387, "r_x3": 163.111, "r_y3": 454.387, "coord_origin": "TOPLEFT"}, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 163.111, "t": 476.479, "r": 452.241, "b": 498.727, "coord_origin": "TOPLEFT"}, "confidence": 0.9304055571556091, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 486.62, "r_x1": 211.942, "r_y1": 486.62, "r_x2": 211.942, "r_y2": 478.694, "r_x3": 163.111, "r_y3": 478.694, "coord_origin": "TOPLEFT"}, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.552, "r_y0": 487.768, "r_x1": 452.241, "r_y1": 487.768, "r_x2": 452.241, "r_y2": 476.479, "r_x3": 216.552, "r_y3": 476.479, "coord_origin": "TOPLEFT"}, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 498.727, "r_x1": 257.642, "r_y1": 498.727, "r_x2": 257.642, "r_y2": 487.438, "r_x3": 163.111, "r_y3": 487.438, "coord_origin": "TOPLEFT"}, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 522.12, "r": 228.934, "b": 532.688, "coord_origin": "TOPLEFT"}, "confidence": 0.9392016530036926, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 532.688, "r_x1": 141.489, "r_y1": 532.688, "r_x2": 141.489, "r_y2": 522.12, "r_x3": 134.765, "r_y3": 522.12, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 532.688, "r_x1": 228.934, "r_y1": 532.688, "r_x2": 228.934, "r_y2": 522.12, "r_x3": 154.938, "r_y3": 522.12, "coord_origin": "TOPLEFT"}, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 548.287, "r": 480.596, "b": 628.815, "coord_origin": "TOPLEFT"}, "confidence": 0.9835679531097412, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.0840000000001, "r_x1": 480.594, "r_y1": 557.0840000000001, "r_x2": 480.594, "r_y2": 548.287, "r_x3": 134.765, "r_y3": 548.287, "coord_origin": "TOPLEFT"}, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.04, "r_x1": 480.592, "r_y1": 569.04, "r_x2": 480.592, "r_y2": 560.2429999999999, "r_x3": 134.765, "r_y3": 560.2429999999999, "coord_origin": "TOPLEFT"}, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 580.995, "r_x1": 170.451, "r_y1": 580.995, "r_x2": 170.451, "r_y2": 572.198, "r_x3": 134.765, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "valuable", "orig": "valuable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.173, "r_y0": 580.995, "r_x1": 225.832, "r_y1": 580.995, "r_x2": 225.832, "r_y2": 572.198, "r_x3": 175.173, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "information", "orig": "information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.544, "r_y0": 580.995, "r_x1": 289.826, "r_y1": 580.995, "r_x2": 289.826, "r_y2": 572.198, "r_x3": 230.544, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "and therefore", "orig": "and therefore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 294.538, "r_y0": 580.995, "r_x1": 388.395, "r_y1": 580.995, "r_x2": 388.395, "r_y2": 572.198, "r_x3": 294.538, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "need to be extracted", "orig": "need to be extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.107, "r_y0": 580.995, "r_x1": 480.593, "r_y1": 580.995, "r_x2": 480.593, "r_y2": 572.198, "r_x3": 393.107, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "with high accuracy.", "orig": "with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 592.95, "r_x1": 480.596, "r_y1": 592.95, "r_x2": 480.596, "r_y2": 584.153, "r_x3": 134.765, "r_y3": 584.153, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 604.905, "r_x1": 155.266, "r_y1": 604.905, "r_x2": 155.266, "r_y2": 596.108, "r_x3": 134.765, "r_y3": 596.108, "coord_origin": "TOPLEFT"}, "text": "ture,", "orig": "ture,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.48, "r_y0": 604.905, "r_x1": 480.587, "r_y1": 604.905, "r_x2": 480.587, "r_y2": 596.108, "r_x3": 159.48, "r_y3": 596.108, "coord_origin": "TOPLEFT"}, "text": "making it difficult to recover their correct structure with simple analyt-", "orig": "making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 616.86, "r_x1": 149.705, "r_y1": 616.86, "r_x2": 149.705, "r_y2": 608.063, "r_x3": 134.765, "r_y3": 608.063, "coord_origin": "TOPLEFT"}, "text": "ical", "orig": "ical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.71, "r_y0": 616.86, "r_x1": 480.591, "r_y1": 616.86, "r_x2": 480.591, "r_y2": 608.063, "r_x3": 153.71, "r_y3": 608.063, "coord_origin": "TOPLEFT"}, "text": "methods. Therefore, accurate table extraction is achieved these days with", "orig": "methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.815, "r_x1": 279.327, "r_y1": 628.815, "r_x2": 279.327, "r_y2": 620.018, "r_x3": 134.765, "r_y3": 620.018, "coord_origin": "TOPLEFT"}, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 632.148, "r": 480.596, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9696458578109741, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.708, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 149.708, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.596, "r_y1": 652.9, "r_x2": 480.596, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 480.595, "r_y1": 664.855, "r_x2": 480.595, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "page_header", "bbox": {"l": 18.34, "t": 215.0, "r": 36.34, "b": 555.0, "coord_origin": "TOPLEFT"}, "confidence": 0.8899643421173096, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 555.0, "r_x1": 36.34, "r_y1": 375.0, "r_x2": 18.34, "r_y2": 375.0, "r_x3": 18.34, "r_y3": 555.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2305.03393v1", "orig": "arXiv:2305.03393v1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 355.0, "r_x1": 36.34, "r_y1": 285.0, "r_x2": 18.34, "r_y2": 285.0, "r_x3": 18.34, "r_y3": 355.0, "coord_origin": "TOPLEFT"}, "text": "[cs.CV]", "orig": "[cs.CV]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 265.0, "r_x1": 36.34, "r_y1": 255.0, "r_x2": 18.34, "r_y2": 255.0, "r_x3": 18.34, "r_y3": 265.0, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 245.0, "r_x1": 36.34, "r_y1": 215.0, "r_x2": 18.34, "r_y2": 215.0, "r_x3": 18.34, "r_y3": 245.0, "coord_origin": "TOPLEFT"}, "text": "May", "orig": "May", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 18.34, "t": 165.0, "r": 36.34, "b": 205.0, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 205.0, "r_x1": 36.34, "r_y1": 165.0, "r_x2": 18.34, "r_y2": 165.0, "r_x3": 18.34, "r_y3": 205.0, "coord_origin": "TOPLEFT"}, "text": "2023", "orig": "2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "section_header", "id": 5, "page_no": 0, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 134.765, "t": 115.899, "r": 480.597, "b": 146.514, "coord_origin": "TOPLEFT"}, "confidence": 0.8918349742889404, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.58100000000002, "r_x1": 480.597, "r_y1": 128.58100000000002, "r_x2": 480.597, "r_y2": 115.899, "r_x3": 134.765, "r_y3": 115.899, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.675, "r_y0": 146.514, "r_x1": 348.685, "r_y1": 146.514, "r_x2": 348.685, "r_y2": 133.832, "r_x3": 266.675, "r_y3": 133.832, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "key_value_region", "id": 16, "page_no": 0, "cluster": {"id": 16, "label": "key_value_region", "bbox": {"l": 139.343, "t": 170.159, "r": 476.013, "b": 236.27800000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.48445820808410645, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.226, "r_y0": 180.471, "r_x1": 217.044, "r_y1": 180.471, "r_x2": 217.044, "r_y2": 171.67399999999998, "r_x3": 151.226, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.046, "r_y0": 176.25300000000004, "r_x1": 235.188, "r_y1": 176.25300000000004, "r_x2": 235.188, "r_y2": 170.159, "r_x3": 217.046, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.186, "r_y0": 176.154, "r_x1": 241.413, "r_y1": 176.154, "r_x2": 241.413, "r_y2": 170.159, "r_x3": 235.186, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.413, "r_y0": 176.25300000000004, "r_x1": 257.299, "r_y1": 176.25300000000004, "r_x2": 257.299, "r_y2": 170.159, "r_x3": 241.413, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.298, "r_y0": 176.154, "r_x1": 263.525, "r_y1": 176.154, "r_x2": 263.525, "r_y2": 170.159, "r_x3": 257.298, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.525, "r_y0": 176.25300000000004, "r_x1": 279.411, "r_y1": 176.25300000000004, "r_x2": 279.411, "r_y2": 170.159, "r_x3": 263.525, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.41, "r_y0": 176.154, "r_x1": 285.637, "r_y1": 176.154, "r_x2": 285.637, "r_y2": 170.159, "r_x3": 279.41, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.636, "r_y0": 176.25300000000004, "r_x1": 303.778, "r_y1": 176.25300000000004, "r_x2": 303.778, "r_y2": 170.159, "r_x3": 285.636, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "6960]", "orig": "6960]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.275, "r_y0": 180.471, "r_x1": 307.042, "r_y1": 180.471, "r_x2": 307.042, "r_y2": 171.67399999999998, "r_x3": 304.275, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 310.359, "r_y0": 180.471, "r_x1": 374.138, "r_y1": 180.471, "r_x2": 374.138, "r_y2": 171.67399999999998, "r_x3": 310.359, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar", "orig": "Ahmed Nassar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.135, "r_y0": 176.25300000000004, "r_x1": 392.277, "r_y1": 176.25300000000004, "r_x2": 392.277, "r_y2": 170.159, "r_x3": 374.135, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.275, "r_y0": 176.154, "r_x1": 398.502, "r_y1": 176.154, "r_x2": 398.502, "r_y2": 170.159, "r_x3": 392.275, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.502, "r_y0": 176.25300000000004, "r_x1": 414.388, "r_y1": 176.25300000000004, "r_x2": 414.388, "r_y2": 170.159, "r_x3": 398.502, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 414.387, "r_y0": 176.154, "r_x1": 420.614, "r_y1": 176.154, "r_x2": 420.614, "r_y2": 170.159, "r_x3": 414.387, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.613, "r_y0": 176.25300000000004, "r_x1": 436.499, "r_y1": 176.25300000000004, "r_x2": 436.499, "r_y2": 170.159, "r_x3": 420.613, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.498, "r_y0": 176.154, "r_x1": 442.725, "r_y1": 176.154, "r_x2": 442.725, "r_y2": 170.159, "r_x3": 436.498, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.725, "r_y0": 176.25300000000004, "r_x1": 460.867, "r_y1": 176.25300000000004, "r_x2": 460.867, "r_y2": 170.159, "r_x3": 442.725, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0822]", "orig": "0822]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.363, "r_y0": 180.471, "r_x1": 464.13, "r_y1": 180.471, "r_x2": 464.13, "r_y2": 171.67399999999998, "r_x3": 461.363, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.343, "r_y0": 192.42600000000004, "r_x1": 224.807, "r_y1": 192.42600000000004, "r_x2": 224.807, "r_y2": 183.62900000000002, "r_x3": 139.343, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.807, "r_y0": 188.20899999999995, "r_x1": 242.949, "r_y1": 188.20899999999995, "r_x2": 242.949, "r_y2": 182.115, "r_x3": 224.807, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.947, "r_y0": 188.11, "r_x1": 249.174, "r_y1": 188.11, "r_x2": 249.174, "r_y2": 182.115, "r_x3": 242.947, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.174, "r_y0": 188.20899999999995, "r_x1": 265.06, "r_y1": 188.20899999999995, "r_x2": 265.06, "r_y2": 182.115, "r_x3": 249.174, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.059, "r_y0": 188.11, "r_x1": 271.286, "r_y1": 188.11, "r_x2": 271.286, "r_y2": 182.115, "r_x3": 265.059, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.285, "r_y0": 188.20899999999995, "r_x1": 287.171, "r_y1": 188.20899999999995, "r_x2": 287.171, "r_y2": 182.115, "r_x3": 271.285, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.17, "r_y0": 188.11, "r_x1": 293.397, "r_y1": 188.11, "r_x2": 293.397, "r_y2": 182.115, "r_x3": 287.17, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.397, "r_y0": 188.20899999999995, "r_x1": 311.539, "r_y1": 188.20899999999995, "r_x2": 311.539, "r_y2": 182.115, "r_x3": 293.397, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "3491]", "orig": "3491]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.035, "r_y0": 192.42600000000004, "r_x1": 314.802, "r_y1": 192.42600000000004, "r_x2": 314.802, "r_y2": 183.62900000000002, "r_x3": 312.035, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.119, "r_y0": 192.42600000000004, "r_x1": 386.02, "r_y1": 192.42600000000004, "r_x2": 386.02, "r_y2": 183.62900000000002, "r_x3": 318.119, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Christoph Auer", "orig": "Christoph Auer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.018, "r_y0": 188.20899999999995, "r_x1": 404.16, "r_y1": 188.20899999999995, "r_x2": 404.16, "r_y2": 182.115, "r_x3": 386.018, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 404.158, "r_y0": 188.11, "r_x1": 410.385, "r_y1": 188.11, "r_x2": 410.385, "r_y2": 182.115, "r_x3": 404.158, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.385, "r_y0": 188.20899999999995, "r_x1": 426.271, "r_y1": 188.20899999999995, "r_x2": 426.271, "r_y2": 182.115, "r_x3": 410.385, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.27, "r_y0": 188.11, "r_x1": 432.497, "r_y1": 188.11, "r_x2": 432.497, "r_y2": 182.115, "r_x3": 426.27, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.496, "r_y0": 188.20899999999995, "r_x1": 448.382, "r_y1": 188.20899999999995, "r_x2": 448.382, "r_y2": 182.115, "r_x3": 432.496, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.381, "r_y0": 188.11, "r_x1": 454.608, "r_y1": 188.11, "r_x2": 454.608, "r_y2": 182.115, "r_x3": 448.381, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.608, "r_y0": 188.20899999999995, "r_x1": 472.75, "r_y1": 188.20899999999995, "r_x2": 472.75, "r_y2": 182.115, "r_x3": 454.608, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0422]", "orig": "0422]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.246, "r_y0": 192.42600000000004, "r_x1": 476.013, "r_y1": 192.42600000000004, "r_x2": 476.013, "r_y2": 183.62900000000002, "r_x3": 473.246, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.521, "r_y0": 204.38099999999997, "r_x1": 298.609, "r_y1": 204.38099999999997, "r_x2": 298.609, "r_y2": 195.58399999999995, "r_x3": 229.521, "r_y3": 195.58399999999995, "coord_origin": "TOPLEFT"}, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.606, "r_y0": 200.164, "r_x1": 316.748, "r_y1": 200.164, "r_x2": 316.748, "r_y2": 194.07000000000005, "r_x3": 298.606, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.746, "r_y0": 200.06500000000005, "r_x1": 322.973, "r_y1": 200.06500000000005, "r_x2": 322.973, "r_y2": 194.07000000000005, "r_x3": 316.746, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.973, "r_y0": 200.164, "r_x1": 338.859, "r_y1": 200.164, "r_x2": 338.859, "r_y2": 194.07000000000005, "r_x3": 322.973, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.858, "r_y0": 200.06500000000005, "r_x1": 345.085, "r_y1": 200.06500000000005, "r_x2": 345.085, "r_y2": 194.07000000000005, "r_x3": 338.858, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.085, "r_y0": 200.164, "r_x1": 360.971, "r_y1": 200.164, "r_x2": 360.971, "r_y2": 194.07000000000005, "r_x3": 345.085, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.97, "r_y0": 200.06500000000005, "r_x1": 367.197, "r_y1": 200.06500000000005, "r_x2": 367.197, "r_y2": 194.07000000000005, "r_x3": 360.97, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.196, "r_y0": 200.164, "r_x1": 385.338, "r_y1": 200.164, "r_x2": 385.338, "r_y2": 194.07000000000005, "r_x3": 367.196, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.105, "r_y0": 226.21500000000003, "r_x1": 336.251, "r_y1": 226.21500000000003, "r_x2": 336.251, "r_y2": 214.92600000000004, "r_x3": 279.105, "r_y3": 214.92600000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.966, "r_y0": 236.27800000000002, "r_x1": 392.39, "r_y1": 236.27800000000002, "r_x2": 392.39, "r_y2": 228.80899999999997, "r_x3": 222.966, "r_y3": 228.80899999999997, "coord_origin": "TOPLEFT"}, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 7, "label": "text", "bbox": {"l": 139.343, "t": 170.159, "r": 476.013, "b": 200.164, "coord_origin": "TOPLEFT"}, "confidence": 0.7918068766593933, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.226, "r_y0": 180.471, "r_x1": 217.044, "r_y1": 180.471, "r_x2": 217.044, "r_y2": 171.67399999999998, "r_x3": 151.226, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.046, "r_y0": 176.25300000000004, "r_x1": 235.188, "r_y1": 176.25300000000004, "r_x2": 235.188, "r_y2": 170.159, "r_x3": 217.046, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.186, "r_y0": 176.154, "r_x1": 241.413, "r_y1": 176.154, "r_x2": 241.413, "r_y2": 170.159, "r_x3": 235.186, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.413, "r_y0": 176.25300000000004, "r_x1": 257.299, "r_y1": 176.25300000000004, "r_x2": 257.299, "r_y2": 170.159, "r_x3": 241.413, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.298, "r_y0": 176.154, "r_x1": 263.525, "r_y1": 176.154, "r_x2": 263.525, "r_y2": 170.159, "r_x3": 257.298, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.525, "r_y0": 176.25300000000004, "r_x1": 279.411, "r_y1": 176.25300000000004, "r_x2": 279.411, "r_y2": 170.159, "r_x3": 263.525, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.41, "r_y0": 176.154, "r_x1": 285.637, "r_y1": 176.154, "r_x2": 285.637, "r_y2": 170.159, "r_x3": 279.41, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.636, "r_y0": 176.25300000000004, "r_x1": 303.778, "r_y1": 176.25300000000004, "r_x2": 303.778, "r_y2": 170.159, "r_x3": 285.636, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "6960]", "orig": "6960]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.275, "r_y0": 180.471, "r_x1": 307.042, "r_y1": 180.471, "r_x2": 307.042, "r_y2": 171.67399999999998, "r_x3": 304.275, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 310.359, "r_y0": 180.471, "r_x1": 374.138, "r_y1": 180.471, "r_x2": 374.138, "r_y2": 171.67399999999998, "r_x3": 310.359, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar", "orig": "Ahmed Nassar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.135, "r_y0": 176.25300000000004, "r_x1": 392.277, "r_y1": 176.25300000000004, "r_x2": 392.277, "r_y2": 170.159, "r_x3": 374.135, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.275, "r_y0": 176.154, "r_x1": 398.502, "r_y1": 176.154, "r_x2": 398.502, "r_y2": 170.159, "r_x3": 392.275, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.502, "r_y0": 176.25300000000004, "r_x1": 414.388, "r_y1": 176.25300000000004, "r_x2": 414.388, "r_y2": 170.159, "r_x3": 398.502, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 414.387, "r_y0": 176.154, "r_x1": 420.614, "r_y1": 176.154, "r_x2": 420.614, "r_y2": 170.159, "r_x3": 414.387, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.613, "r_y0": 176.25300000000004, "r_x1": 436.499, "r_y1": 176.25300000000004, "r_x2": 436.499, "r_y2": 170.159, "r_x3": 420.613, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.498, "r_y0": 176.154, "r_x1": 442.725, "r_y1": 176.154, "r_x2": 442.725, "r_y2": 170.159, "r_x3": 436.498, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.725, "r_y0": 176.25300000000004, "r_x1": 460.867, "r_y1": 176.25300000000004, "r_x2": 460.867, "r_y2": 170.159, "r_x3": 442.725, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0822]", "orig": "0822]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.363, "r_y0": 180.471, "r_x1": 464.13, "r_y1": 180.471, "r_x2": 464.13, "r_y2": 171.67399999999998, "r_x3": 461.363, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.343, "r_y0": 192.42600000000004, "r_x1": 224.807, "r_y1": 192.42600000000004, "r_x2": 224.807, "r_y2": 183.62900000000002, "r_x3": 139.343, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.807, "r_y0": 188.20899999999995, "r_x1": 242.949, "r_y1": 188.20899999999995, "r_x2": 242.949, "r_y2": 182.115, "r_x3": 224.807, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.947, "r_y0": 188.11, "r_x1": 249.174, "r_y1": 188.11, "r_x2": 249.174, "r_y2": 182.115, "r_x3": 242.947, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.174, "r_y0": 188.20899999999995, "r_x1": 265.06, "r_y1": 188.20899999999995, "r_x2": 265.06, "r_y2": 182.115, "r_x3": 249.174, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.059, "r_y0": 188.11, "r_x1": 271.286, "r_y1": 188.11, "r_x2": 271.286, "r_y2": 182.115, "r_x3": 265.059, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.285, "r_y0": 188.20899999999995, "r_x1": 287.171, "r_y1": 188.20899999999995, "r_x2": 287.171, "r_y2": 182.115, "r_x3": 271.285, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.17, "r_y0": 188.11, "r_x1": 293.397, "r_y1": 188.11, "r_x2": 293.397, "r_y2": 182.115, "r_x3": 287.17, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.397, "r_y0": 188.20899999999995, "r_x1": 311.539, "r_y1": 188.20899999999995, "r_x2": 311.539, "r_y2": 182.115, "r_x3": 293.397, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "3491]", "orig": "3491]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.035, "r_y0": 192.42600000000004, "r_x1": 314.802, "r_y1": 192.42600000000004, "r_x2": 314.802, "r_y2": 183.62900000000002, "r_x3": 312.035, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.119, "r_y0": 192.42600000000004, "r_x1": 386.02, "r_y1": 192.42600000000004, "r_x2": 386.02, "r_y2": 183.62900000000002, "r_x3": 318.119, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Christoph Auer", "orig": "Christoph Auer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.018, "r_y0": 188.20899999999995, "r_x1": 404.16, "r_y1": 188.20899999999995, "r_x2": 404.16, "r_y2": 182.115, "r_x3": 386.018, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 404.158, "r_y0": 188.11, "r_x1": 410.385, "r_y1": 188.11, "r_x2": 410.385, "r_y2": 182.115, "r_x3": 404.158, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.385, "r_y0": 188.20899999999995, "r_x1": 426.271, "r_y1": 188.20899999999995, "r_x2": 426.271, "r_y2": 182.115, "r_x3": 410.385, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.27, "r_y0": 188.11, "r_x1": 432.497, "r_y1": 188.11, "r_x2": 432.497, "r_y2": 182.115, "r_x3": 426.27, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.496, "r_y0": 188.20899999999995, "r_x1": 448.382, "r_y1": 188.20899999999995, "r_x2": 448.382, "r_y2": 182.115, "r_x3": 432.496, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.381, "r_y0": 188.11, "r_x1": 454.608, "r_y1": 188.11, "r_x2": 454.608, "r_y2": 182.115, "r_x3": 448.381, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.608, "r_y0": 188.20899999999995, "r_x1": 472.75, "r_y1": 188.20899999999995, "r_x2": 472.75, "r_y2": 182.115, "r_x3": 454.608, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0422]", "orig": "0422]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.246, "r_y0": 192.42600000000004, "r_x1": 476.013, "r_y1": 192.42600000000004, "r_x2": 476.013, "r_y2": 183.62900000000002, "r_x3": 473.246, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.606, "r_y0": 200.164, "r_x1": 316.748, "r_y1": 200.164, "r_x2": 316.748, "r_y2": 194.07000000000005, "r_x3": 298.606, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.746, "r_y0": 200.06500000000005, "r_x1": 322.973, "r_y1": 200.06500000000005, "r_x2": 322.973, "r_y2": 194.07000000000005, "r_x3": 316.746, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.973, "r_y0": 200.164, "r_x1": 338.859, "r_y1": 200.164, "r_x2": 338.859, "r_y2": 194.07000000000005, "r_x3": 322.973, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.858, "r_y0": 200.06500000000005, "r_x1": 345.085, "r_y1": 200.06500000000005, "r_x2": 345.085, "r_y2": 194.07000000000005, "r_x3": 338.858, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.085, "r_y0": 200.164, "r_x1": 360.971, "r_y1": 200.164, "r_x2": 360.971, "r_y2": 194.07000000000005, "r_x3": 345.085, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.97, "r_y0": 200.06500000000005, "r_x1": 367.197, "r_y1": 200.06500000000005, "r_x2": 367.197, "r_y2": 194.07000000000005, "r_x3": 360.97, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.196, "r_y0": 200.164, "r_x1": 385.338, "r_y1": 200.164, "r_x2": 385.338, "r_y2": 194.07000000000005, "r_x3": 367.196, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 229.521, "t": 195.58399999999995, "r": 298.609, "b": 204.38099999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.5015263557434082, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.521, "r_y0": 204.38099999999997, "r_x1": 298.609, "r_y1": 204.38099999999997, "r_x2": 298.609, "r_y2": 195.58399999999995, "r_x3": 229.521, "r_y3": 195.58399999999995, "coord_origin": "TOPLEFT"}, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "text", "bbox": {"l": 279.105, "t": 214.92600000000004, "r": 336.251, "b": 226.21500000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.6310867667198181, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.105, "r_y0": 226.21500000000003, "r_x1": 336.251, "r_y1": 226.21500000000003, "r_x2": 336.251, "r_y2": 214.92600000000004, "r_x3": 279.105, "r_y3": 214.92600000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "text", "bbox": {"l": 222.966, "t": 228.80899999999997, "r": 392.39, "b": 236.27800000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.6924149990081787, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.966, "r_y0": 236.27800000000002, "r_x1": 392.39, "r_y1": 236.27800000000002, "r_x2": 392.39, "r_y2": 228.80899999999997, "r_x3": 222.966, "r_y3": 228.80899999999997, "coord_origin": "TOPLEFT"}, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null}, {"label": "text", "id": 1, "page_no": 0, "cluster": {"id": 1, "label": "text", "bbox": {"l": 163.111, "t": 268.086, "r": 452.249, "b": 465.676, "coord_origin": "TOPLEFT"}, "confidence": 0.9807654023170471, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 278.227, "r_x1": 206.636, "r_y1": 278.227, "r_x2": 206.636, "r_y2": 270.30100000000004, "r_x3": 163.111, "r_y3": 270.30100000000004, "coord_origin": "TOPLEFT"}, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.617, "r_y0": 279.375, "r_x1": 452.245, "r_y1": 279.375, "r_x2": 452.245, "r_y2": 268.086, "r_x3": 211.617, "r_y3": 268.086, "coord_origin": "TOPLEFT"}, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 290.334, "r_x1": 452.242, "r_y1": 290.334, "r_x2": 452.242, "r_y2": 279.04499999999996, "r_x3": 163.111, "r_y3": 279.04499999999996, "coord_origin": "TOPLEFT"}, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 301.293, "r_x1": 452.248, "r_y1": 301.293, "r_x2": 452.248, "r_y2": 290.004, "r_x3": 163.111, "r_y3": 290.004, "coord_origin": "TOPLEFT"}, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 312.252, "r_x1": 452.241, "r_y1": 312.252, "r_x2": 452.241, "r_y2": 300.963, "r_x3": 163.111, "r_y3": 300.963, "coord_origin": "TOPLEFT"}, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 323.21, "r_x1": 452.246, "r_y1": 323.21, "r_x2": 452.246, "r_y2": 311.921, "r_x3": 163.111, "r_y3": 311.921, "coord_origin": "TOPLEFT"}, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 334.169, "r_x1": 452.246, "r_y1": 334.169, "r_x2": 452.246, "r_y2": 322.88, "r_x3": 163.111, "r_y3": 322.88, "coord_origin": "TOPLEFT"}, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 345.128, "r_x1": 452.247, "r_y1": 345.128, "r_x2": 452.247, "r_y2": 333.839, "r_x3": 163.111, "r_y3": 333.839, "coord_origin": "TOPLEFT"}, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 356.087, "r_x1": 452.246, "r_y1": 356.087, "r_x2": 452.246, "r_y2": 344.798, "r_x3": 163.111, "r_y3": 344.798, "coord_origin": "TOPLEFT"}, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 367.046, "r_x1": 452.248, "r_y1": 367.046, "r_x2": 452.248, "r_y2": 355.757, "r_x3": 163.111, "r_y3": 355.757, "coord_origin": "TOPLEFT"}, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 378.005, "r_x1": 452.246, "r_y1": 378.005, "r_x2": 452.246, "r_y2": 366.716, "r_x3": 163.111, "r_y3": 366.716, "coord_origin": "TOPLEFT"}, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 388.964, "r_x1": 452.242, "r_y1": 388.964, "r_x2": 452.242, "r_y2": 377.675, "r_x3": 163.111, "r_y3": 377.675, "coord_origin": "TOPLEFT"}, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 399.923, "r_x1": 169.253, "r_y1": 399.923, "r_x2": 169.253, "r_y2": 388.634, "r_x3": 163.111, "r_y3": 388.634, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.795, "r_y0": 399.923, "r_x1": 452.244, "r_y1": 399.923, "r_x2": 452.244, "r_y2": 388.634, "r_x3": 172.795, "r_y3": 388.634, "coord_origin": "TOPLEFT"}, "text": "reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 410.882, "r_x1": 452.249, "r_y1": 410.882, "r_x2": 452.249, "r_y2": 399.593, "r_x3": 163.111, "r_y3": 399.593, "coord_origin": "TOPLEFT"}, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 421.841, "r_x1": 198.194, "r_y1": 421.841, "r_x2": 198.194, "r_y2": 410.552, "r_x3": 163.111, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "accuracy", "orig": "accuracy", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.632, "r_y0": 421.841, "r_x1": 292.676, "r_y1": 421.841, "r_x2": 292.676, "r_y2": 410.552, "r_x3": 202.632, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "improves significantly,", "orig": "improves significantly,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.115, "r_y0": 421.841, "r_x1": 332.719, "r_y1": 421.841, "r_x2": 332.719, "r_y2": 410.552, "r_x3": 297.115, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "inference", "orig": "inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.158, "r_y0": 421.841, "r_x1": 365.708, "r_y1": 421.841, "r_x2": 365.708, "r_y2": 410.552, "r_x3": 337.158, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "time is", "orig": "time is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.146, "r_y0": 421.841, "r_x1": 396.249, "r_y1": 421.841, "r_x2": 396.249, "r_y2": 410.552, "r_x3": 370.146, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "halved", "orig": "halved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.696, "r_y0": 421.841, "r_x1": 452.241, "r_y1": 421.841, "r_x2": 452.241, "r_y2": 410.552, "r_x3": 400.696, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "compared to", "orig": "compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 432.799, "r_x1": 452.242, "r_y1": 432.799, "r_x2": 452.242, "r_y2": 421.51, "r_x3": 163.111, "r_y3": 421.51, "coord_origin": "TOPLEFT"}, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 443.758, "r_x1": 200.22, "r_y1": 443.758, "r_x2": 200.22, "r_y2": 432.469, "r_x3": 163.111, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "tactically", "orig": "tactically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 204.282, "r_y0": 443.758, "r_x1": 234.527, "r_y1": 443.758, "r_x2": 234.527, "r_y2": 432.469, "r_x3": 204.282, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "correct.", "orig": "correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 238.588, "r_y0": 443.758, "r_x1": 452.244, "r_y1": 443.758, "r_x2": 452.244, "r_y2": 432.469, "r_x3": 238.588, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "This in turn eliminates most post-processing needs.", "orig": "This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 454.717, "r_x1": 452.246, "r_y1": 454.717, "r_x2": 452.246, "r_y2": 443.428, "r_x3": 163.111, "r_y3": 443.428, "coord_origin": "TOPLEFT"}, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 465.676, "r_x1": 225.561, "r_y1": 465.676, "r_x2": 225.561, "r_y2": 454.387, "r_x3": 163.111, "r_y3": 454.387, "coord_origin": "TOPLEFT"}, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Abstract. Extracting tables from documents is a crucial task in any document conversion pipeline. Recently, transformer-based models have demonstrated that table-structure can be recognized with impressive accuracy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking only the image of a table, such models predict a sequence of tokens (e.g. in HTML, LaTeX) which represent the structure of the table. Since the token representation of the table structure has a significant impact on the accuracy and run-time performance of any Im2Seq model, we investigate in this paper how table-structure representation can be optimised. We propose a new, optimised table-structure language (OTSL) with a minimized vocabulary and specific rules. The benefits of OTSL are that it reduces the number of tokens to 5 (HTML needs 28+) and shortens the sequence length to half of HTML on average. Consequently, model accuracy improves significantly, inference time is halved compared to HTML-based models, and the predicted table structures are always syntactically correct. This in turn eliminates most post-processing needs. Popular table structure data-sets will be published in OTSL format to the community."}, {"label": "text", "id": 4, "page_no": 0, "cluster": {"id": 4, "label": "text", "bbox": {"l": 163.111, "t": 476.479, "r": 452.241, "b": 498.727, "coord_origin": "TOPLEFT"}, "confidence": 0.9304055571556091, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 486.62, "r_x1": 211.942, "r_y1": 486.62, "r_x2": 211.942, "r_y2": 478.694, "r_x3": 163.111, "r_y3": 478.694, "coord_origin": "TOPLEFT"}, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.552, "r_y0": 487.768, "r_x1": 452.241, "r_y1": 487.768, "r_x2": 452.241, "r_y2": 476.479, "r_x3": 216.552, "r_y3": 476.479, "coord_origin": "TOPLEFT"}, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 498.727, "r_x1": 257.642, "r_y1": 498.727, "r_x2": 257.642, "r_y2": 487.438, "r_x3": 163.111, "r_y3": 487.438, "coord_origin": "TOPLEFT"}, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Keywords: Table Structure Recognition \u00b7 Data Representation \u00b7 Transformers \u00b7 Optimization."}, {"label": "section_header", "id": 3, "page_no": 0, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 522.12, "r": 228.934, "b": 532.688, "coord_origin": "TOPLEFT"}, "confidence": 0.9392016530036926, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 532.688, "r_x1": 141.489, "r_y1": 532.688, "r_x2": 141.489, "r_y2": 522.12, "r_x3": 134.765, "r_y3": 522.12, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 532.688, "r_x1": 228.934, "r_y1": 532.688, "r_x2": 228.934, "r_y2": 522.12, "r_x3": 154.938, "r_y3": 522.12, "coord_origin": "TOPLEFT"}, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1 Introduction"}, {"label": "text", "id": 0, "page_no": 0, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 548.287, "r": 480.596, "b": 628.815, "coord_origin": "TOPLEFT"}, "confidence": 0.9835679531097412, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.0840000000001, "r_x1": 480.594, "r_y1": 557.0840000000001, "r_x2": 480.594, "r_y2": 548.287, "r_x3": 134.765, "r_y3": 548.287, "coord_origin": "TOPLEFT"}, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.04, "r_x1": 480.592, "r_y1": 569.04, "r_x2": 480.592, "r_y2": 560.2429999999999, "r_x3": 134.765, "r_y3": 560.2429999999999, "coord_origin": "TOPLEFT"}, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 580.995, "r_x1": 170.451, "r_y1": 580.995, "r_x2": 170.451, "r_y2": 572.198, "r_x3": 134.765, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "valuable", "orig": "valuable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.173, "r_y0": 580.995, "r_x1": 225.832, "r_y1": 580.995, "r_x2": 225.832, "r_y2": 572.198, "r_x3": 175.173, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "information", "orig": "information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.544, "r_y0": 580.995, "r_x1": 289.826, "r_y1": 580.995, "r_x2": 289.826, "r_y2": 572.198, "r_x3": 230.544, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "and therefore", "orig": "and therefore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 294.538, "r_y0": 580.995, "r_x1": 388.395, "r_y1": 580.995, "r_x2": 388.395, "r_y2": 572.198, "r_x3": 294.538, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "need to be extracted", "orig": "need to be extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.107, "r_y0": 580.995, "r_x1": 480.593, "r_y1": 580.995, "r_x2": 480.593, "r_y2": 572.198, "r_x3": 393.107, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "with high accuracy.", "orig": "with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 592.95, "r_x1": 480.596, "r_y1": 592.95, "r_x2": 480.596, "r_y2": 584.153, "r_x3": 134.765, "r_y3": 584.153, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 604.905, "r_x1": 155.266, "r_y1": 604.905, "r_x2": 155.266, "r_y2": 596.108, "r_x3": 134.765, "r_y3": 596.108, "coord_origin": "TOPLEFT"}, "text": "ture,", "orig": "ture,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.48, "r_y0": 604.905, "r_x1": 480.587, "r_y1": 604.905, "r_x2": 480.587, "r_y2": 596.108, "r_x3": 159.48, "r_y3": 596.108, "coord_origin": "TOPLEFT"}, "text": "making it difficult to recover their correct structure with simple analyt-", "orig": "making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 616.86, "r_x1": 149.705, "r_y1": 616.86, "r_x2": 149.705, "r_y2": 608.063, "r_x3": 134.765, "r_y3": 608.063, "coord_origin": "TOPLEFT"}, "text": "ical", "orig": "ical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.71, "r_y0": 616.86, "r_x1": 480.591, "r_y1": 616.86, "r_x2": 480.591, "r_y2": 608.063, "r_x3": 153.71, "r_y3": 608.063, "coord_origin": "TOPLEFT"}, "text": "methods. Therefore, accurate table extraction is achieved these days with", "orig": "methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.815, "r_x1": 279.327, "r_y1": 628.815, "r_x2": 279.327, "r_y2": 620.018, "r_x3": 134.765, "r_y3": 620.018, "coord_origin": "TOPLEFT"}, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports, manuals, specification sheets or marketing material. They often encode highly valuable information and therefore need to be extracted with high accuracy. Unfortunately, tables appear in documents in various sizes, styling and structure, making it difficult to recover their correct structure with simple analytical methods. Therefore, accurate table extraction is achieved these days with machine-learning based methods."}, {"label": "text", "id": 2, "page_no": 0, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 632.148, "r": 480.596, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9696458578109741, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.708, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 149.708, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.596, "r_y1": 652.9, "r_x2": 480.596, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 480.595, "r_y1": 664.855, "r_x2": 480.595, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In modern document understanding systems [1,15], table extraction is typically a two-step process. Firstly, every table on a page is located with a bounding box, and secondly, their logical row and column structure is recognized. As of"}, {"label": "page_header", "id": 6, "page_no": 0, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 18.34, "t": 215.0, "r": 36.34, "b": 555.0, "coord_origin": "TOPLEFT"}, "confidence": 0.8899643421173096, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 555.0, "r_x1": 36.34, "r_y1": 375.0, "r_x2": 18.34, "r_y2": 375.0, "r_x3": 18.34, "r_y3": 555.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2305.03393v1", "orig": "arXiv:2305.03393v1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 355.0, "r_x1": 36.34, "r_y1": 285.0, "r_x2": 18.34, "r_y2": 285.0, "r_x3": 18.34, "r_y3": 355.0, "coord_origin": "TOPLEFT"}, "text": "[cs.CV]", "orig": "[cs.CV]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 265.0, "r_x1": 36.34, "r_y1": 255.0, "r_x2": 18.34, "r_y2": 255.0, "r_x3": 18.34, "r_y3": 265.0, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 245.0, "r_x1": 36.34, "r_y1": 215.0, "r_x2": 18.34, "r_y2": 215.0, "r_x3": 18.34, "r_y3": 245.0, "coord_origin": "TOPLEFT"}, "text": "May", "orig": "May", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "arXiv:2305.03393v1 [cs.CV] 5 May"}, {"label": "text", "id": 37, "page_no": 0, "cluster": {"id": 37, "label": "text", "bbox": {"l": 18.34, "t": 165.0, "r": 36.34, "b": 205.0, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 205.0, "r_x1": 36.34, "r_y1": 165.0, "r_x2": 18.34, "r_y2": 165.0, "r_x3": 18.34, "r_y3": 205.0, "coord_origin": "TOPLEFT"}, "text": "2023", "orig": "2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2023"}], "body": [{"label": "section_header", "id": 5, "page_no": 0, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 134.765, "t": 115.899, "r": 480.597, "b": 146.514, "coord_origin": "TOPLEFT"}, "confidence": 0.8918349742889404, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.58100000000002, "r_x1": 480.597, "r_y1": 128.58100000000002, "r_x2": 480.597, "r_y2": 115.899, "r_x3": 134.765, "r_y3": 115.899, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.675, "r_y0": 146.514, "r_x1": 348.685, "r_y1": 146.514, "r_x2": 348.685, "r_y2": 133.832, "r_x3": 266.675, "r_y3": 133.832, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "key_value_region", "id": 16, "page_no": 0, "cluster": {"id": 16, "label": "key_value_region", "bbox": {"l": 139.343, "t": 170.159, "r": 476.013, "b": 236.27800000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.48445820808410645, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.226, "r_y0": 180.471, "r_x1": 217.044, "r_y1": 180.471, "r_x2": 217.044, "r_y2": 171.67399999999998, "r_x3": 151.226, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.046, "r_y0": 176.25300000000004, "r_x1": 235.188, "r_y1": 176.25300000000004, "r_x2": 235.188, "r_y2": 170.159, "r_x3": 217.046, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.186, "r_y0": 176.154, "r_x1": 241.413, "r_y1": 176.154, "r_x2": 241.413, "r_y2": 170.159, "r_x3": 235.186, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.413, "r_y0": 176.25300000000004, "r_x1": 257.299, "r_y1": 176.25300000000004, "r_x2": 257.299, "r_y2": 170.159, "r_x3": 241.413, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.298, "r_y0": 176.154, "r_x1": 263.525, "r_y1": 176.154, "r_x2": 263.525, "r_y2": 170.159, "r_x3": 257.298, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.525, "r_y0": 176.25300000000004, "r_x1": 279.411, "r_y1": 176.25300000000004, "r_x2": 279.411, "r_y2": 170.159, "r_x3": 263.525, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.41, "r_y0": 176.154, "r_x1": 285.637, "r_y1": 176.154, "r_x2": 285.637, "r_y2": 170.159, "r_x3": 279.41, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.636, "r_y0": 176.25300000000004, "r_x1": 303.778, "r_y1": 176.25300000000004, "r_x2": 303.778, "r_y2": 170.159, "r_x3": 285.636, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "6960]", "orig": "6960]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.275, "r_y0": 180.471, "r_x1": 307.042, "r_y1": 180.471, "r_x2": 307.042, "r_y2": 171.67399999999998, "r_x3": 304.275, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 310.359, "r_y0": 180.471, "r_x1": 374.138, "r_y1": 180.471, "r_x2": 374.138, "r_y2": 171.67399999999998, "r_x3": 310.359, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar", "orig": "Ahmed Nassar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.135, "r_y0": 176.25300000000004, "r_x1": 392.277, "r_y1": 176.25300000000004, "r_x2": 392.277, "r_y2": 170.159, "r_x3": 374.135, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.275, "r_y0": 176.154, "r_x1": 398.502, "r_y1": 176.154, "r_x2": 398.502, "r_y2": 170.159, "r_x3": 392.275, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.502, "r_y0": 176.25300000000004, "r_x1": 414.388, "r_y1": 176.25300000000004, "r_x2": 414.388, "r_y2": 170.159, "r_x3": 398.502, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 414.387, "r_y0": 176.154, "r_x1": 420.614, "r_y1": 176.154, "r_x2": 420.614, "r_y2": 170.159, "r_x3": 414.387, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.613, "r_y0": 176.25300000000004, "r_x1": 436.499, "r_y1": 176.25300000000004, "r_x2": 436.499, "r_y2": 170.159, "r_x3": 420.613, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.498, "r_y0": 176.154, "r_x1": 442.725, "r_y1": 176.154, "r_x2": 442.725, "r_y2": 170.159, "r_x3": 436.498, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.725, "r_y0": 176.25300000000004, "r_x1": 460.867, "r_y1": 176.25300000000004, "r_x2": 460.867, "r_y2": 170.159, "r_x3": 442.725, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0822]", "orig": "0822]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.363, "r_y0": 180.471, "r_x1": 464.13, "r_y1": 180.471, "r_x2": 464.13, "r_y2": 171.67399999999998, "r_x3": 461.363, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.343, "r_y0": 192.42600000000004, "r_x1": 224.807, "r_y1": 192.42600000000004, "r_x2": 224.807, "r_y2": 183.62900000000002, "r_x3": 139.343, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.807, "r_y0": 188.20899999999995, "r_x1": 242.949, "r_y1": 188.20899999999995, "r_x2": 242.949, "r_y2": 182.115, "r_x3": 224.807, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.947, "r_y0": 188.11, "r_x1": 249.174, "r_y1": 188.11, "r_x2": 249.174, "r_y2": 182.115, "r_x3": 242.947, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.174, "r_y0": 188.20899999999995, "r_x1": 265.06, "r_y1": 188.20899999999995, "r_x2": 265.06, "r_y2": 182.115, "r_x3": 249.174, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.059, "r_y0": 188.11, "r_x1": 271.286, "r_y1": 188.11, "r_x2": 271.286, "r_y2": 182.115, "r_x3": 265.059, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.285, "r_y0": 188.20899999999995, "r_x1": 287.171, "r_y1": 188.20899999999995, "r_x2": 287.171, "r_y2": 182.115, "r_x3": 271.285, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.17, "r_y0": 188.11, "r_x1": 293.397, "r_y1": 188.11, "r_x2": 293.397, "r_y2": 182.115, "r_x3": 287.17, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.397, "r_y0": 188.20899999999995, "r_x1": 311.539, "r_y1": 188.20899999999995, "r_x2": 311.539, "r_y2": 182.115, "r_x3": 293.397, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "3491]", "orig": "3491]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.035, "r_y0": 192.42600000000004, "r_x1": 314.802, "r_y1": 192.42600000000004, "r_x2": 314.802, "r_y2": 183.62900000000002, "r_x3": 312.035, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.119, "r_y0": 192.42600000000004, "r_x1": 386.02, "r_y1": 192.42600000000004, "r_x2": 386.02, "r_y2": 183.62900000000002, "r_x3": 318.119, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Christoph Auer", "orig": "Christoph Auer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.018, "r_y0": 188.20899999999995, "r_x1": 404.16, "r_y1": 188.20899999999995, "r_x2": 404.16, "r_y2": 182.115, "r_x3": 386.018, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 404.158, "r_y0": 188.11, "r_x1": 410.385, "r_y1": 188.11, "r_x2": 410.385, "r_y2": 182.115, "r_x3": 404.158, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.385, "r_y0": 188.20899999999995, "r_x1": 426.271, "r_y1": 188.20899999999995, "r_x2": 426.271, "r_y2": 182.115, "r_x3": 410.385, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.27, "r_y0": 188.11, "r_x1": 432.497, "r_y1": 188.11, "r_x2": 432.497, "r_y2": 182.115, "r_x3": 426.27, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.496, "r_y0": 188.20899999999995, "r_x1": 448.382, "r_y1": 188.20899999999995, "r_x2": 448.382, "r_y2": 182.115, "r_x3": 432.496, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.381, "r_y0": 188.11, "r_x1": 454.608, "r_y1": 188.11, "r_x2": 454.608, "r_y2": 182.115, "r_x3": 448.381, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.608, "r_y0": 188.20899999999995, "r_x1": 472.75, "r_y1": 188.20899999999995, "r_x2": 472.75, "r_y2": 182.115, "r_x3": 454.608, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0422]", "orig": "0422]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.246, "r_y0": 192.42600000000004, "r_x1": 476.013, "r_y1": 192.42600000000004, "r_x2": 476.013, "r_y2": 183.62900000000002, "r_x3": 473.246, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.521, "r_y0": 204.38099999999997, "r_x1": 298.609, "r_y1": 204.38099999999997, "r_x2": 298.609, "r_y2": 195.58399999999995, "r_x3": 229.521, "r_y3": 195.58399999999995, "coord_origin": "TOPLEFT"}, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.606, "r_y0": 200.164, "r_x1": 316.748, "r_y1": 200.164, "r_x2": 316.748, "r_y2": 194.07000000000005, "r_x3": 298.606, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.746, "r_y0": 200.06500000000005, "r_x1": 322.973, "r_y1": 200.06500000000005, "r_x2": 322.973, "r_y2": 194.07000000000005, "r_x3": 316.746, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.973, "r_y0": 200.164, "r_x1": 338.859, "r_y1": 200.164, "r_x2": 338.859, "r_y2": 194.07000000000005, "r_x3": 322.973, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.858, "r_y0": 200.06500000000005, "r_x1": 345.085, "r_y1": 200.06500000000005, "r_x2": 345.085, "r_y2": 194.07000000000005, "r_x3": 338.858, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.085, "r_y0": 200.164, "r_x1": 360.971, "r_y1": 200.164, "r_x2": 360.971, "r_y2": 194.07000000000005, "r_x3": 345.085, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.97, "r_y0": 200.06500000000005, "r_x1": 367.197, "r_y1": 200.06500000000005, "r_x2": 367.197, "r_y2": 194.07000000000005, "r_x3": 360.97, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.196, "r_y0": 200.164, "r_x1": 385.338, "r_y1": 200.164, "r_x2": 385.338, "r_y2": 194.07000000000005, "r_x3": 367.196, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.105, "r_y0": 226.21500000000003, "r_x1": 336.251, "r_y1": 226.21500000000003, "r_x2": 336.251, "r_y2": 214.92600000000004, "r_x3": 279.105, "r_y3": 214.92600000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.966, "r_y0": 236.27800000000002, "r_x1": 392.39, "r_y1": 236.27800000000002, "r_x2": 392.39, "r_y2": 228.80899999999997, "r_x3": 222.966, "r_y3": 228.80899999999997, "coord_origin": "TOPLEFT"}, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 7, "label": "text", "bbox": {"l": 139.343, "t": 170.159, "r": 476.013, "b": 200.164, "coord_origin": "TOPLEFT"}, "confidence": 0.7918068766593933, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.226, "r_y0": 180.471, "r_x1": 217.044, "r_y1": 180.471, "r_x2": 217.044, "r_y2": 171.67399999999998, "r_x3": 151.226, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.046, "r_y0": 176.25300000000004, "r_x1": 235.188, "r_y1": 176.25300000000004, "r_x2": 235.188, "r_y2": 170.159, "r_x3": 217.046, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.186, "r_y0": 176.154, "r_x1": 241.413, "r_y1": 176.154, "r_x2": 241.413, "r_y2": 170.159, "r_x3": 235.186, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.413, "r_y0": 176.25300000000004, "r_x1": 257.299, "r_y1": 176.25300000000004, "r_x2": 257.299, "r_y2": 170.159, "r_x3": 241.413, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.298, "r_y0": 176.154, "r_x1": 263.525, "r_y1": 176.154, "r_x2": 263.525, "r_y2": 170.159, "r_x3": 257.298, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.525, "r_y0": 176.25300000000004, "r_x1": 279.411, "r_y1": 176.25300000000004, "r_x2": 279.411, "r_y2": 170.159, "r_x3": 263.525, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.41, "r_y0": 176.154, "r_x1": 285.637, "r_y1": 176.154, "r_x2": 285.637, "r_y2": 170.159, "r_x3": 279.41, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.636, "r_y0": 176.25300000000004, "r_x1": 303.778, "r_y1": 176.25300000000004, "r_x2": 303.778, "r_y2": 170.159, "r_x3": 285.636, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "6960]", "orig": "6960]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.275, "r_y0": 180.471, "r_x1": 307.042, "r_y1": 180.471, "r_x2": 307.042, "r_y2": 171.67399999999998, "r_x3": 304.275, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 310.359, "r_y0": 180.471, "r_x1": 374.138, "r_y1": 180.471, "r_x2": 374.138, "r_y2": 171.67399999999998, "r_x3": 310.359, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar", "orig": "Ahmed Nassar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.135, "r_y0": 176.25300000000004, "r_x1": 392.277, "r_y1": 176.25300000000004, "r_x2": 392.277, "r_y2": 170.159, "r_x3": 374.135, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.275, "r_y0": 176.154, "r_x1": 398.502, "r_y1": 176.154, "r_x2": 398.502, "r_y2": 170.159, "r_x3": 392.275, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.502, "r_y0": 176.25300000000004, "r_x1": 414.388, "r_y1": 176.25300000000004, "r_x2": 414.388, "r_y2": 170.159, "r_x3": 398.502, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 414.387, "r_y0": 176.154, "r_x1": 420.614, "r_y1": 176.154, "r_x2": 420.614, "r_y2": 170.159, "r_x3": 414.387, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.613, "r_y0": 176.25300000000004, "r_x1": 436.499, "r_y1": 176.25300000000004, "r_x2": 436.499, "r_y2": 170.159, "r_x3": 420.613, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.498, "r_y0": 176.154, "r_x1": 442.725, "r_y1": 176.154, "r_x2": 442.725, "r_y2": 170.159, "r_x3": 436.498, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.725, "r_y0": 176.25300000000004, "r_x1": 460.867, "r_y1": 176.25300000000004, "r_x2": 460.867, "r_y2": 170.159, "r_x3": 442.725, "r_y3": 170.159, "coord_origin": "TOPLEFT"}, "text": "0822]", "orig": "0822]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.363, "r_y0": 180.471, "r_x1": 464.13, "r_y1": 180.471, "r_x2": 464.13, "r_y2": 171.67399999999998, "r_x3": 461.363, "r_y3": 171.67399999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.343, "r_y0": 192.42600000000004, "r_x1": 224.807, "r_y1": 192.42600000000004, "r_x2": 224.807, "r_y2": 183.62900000000002, "r_x3": 139.343, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.807, "r_y0": 188.20899999999995, "r_x1": 242.949, "r_y1": 188.20899999999995, "r_x2": 242.949, "r_y2": 182.115, "r_x3": 224.807, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.947, "r_y0": 188.11, "r_x1": 249.174, "r_y1": 188.11, "r_x2": 249.174, "r_y2": 182.115, "r_x3": 242.947, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.174, "r_y0": 188.20899999999995, "r_x1": 265.06, "r_y1": 188.20899999999995, "r_x2": 265.06, "r_y2": 182.115, "r_x3": 249.174, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.059, "r_y0": 188.11, "r_x1": 271.286, "r_y1": 188.11, "r_x2": 271.286, "r_y2": 182.115, "r_x3": 265.059, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.285, "r_y0": 188.20899999999995, "r_x1": 287.171, "r_y1": 188.20899999999995, "r_x2": 287.171, "r_y2": 182.115, "r_x3": 271.285, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.17, "r_y0": 188.11, "r_x1": 293.397, "r_y1": 188.11, "r_x2": 293.397, "r_y2": 182.115, "r_x3": 287.17, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.397, "r_y0": 188.20899999999995, "r_x1": 311.539, "r_y1": 188.20899999999995, "r_x2": 311.539, "r_y2": 182.115, "r_x3": 293.397, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "3491]", "orig": "3491]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.035, "r_y0": 192.42600000000004, "r_x1": 314.802, "r_y1": 192.42600000000004, "r_x2": 314.802, "r_y2": 183.62900000000002, "r_x3": 312.035, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.119, "r_y0": 192.42600000000004, "r_x1": 386.02, "r_y1": 192.42600000000004, "r_x2": 386.02, "r_y2": 183.62900000000002, "r_x3": 318.119, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": "Christoph Auer", "orig": "Christoph Auer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.018, "r_y0": 188.20899999999995, "r_x1": 404.16, "r_y1": 188.20899999999995, "r_x2": 404.16, "r_y2": 182.115, "r_x3": 386.018, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 404.158, "r_y0": 188.11, "r_x1": 410.385, "r_y1": 188.11, "r_x2": 410.385, "r_y2": 182.115, "r_x3": 404.158, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.385, "r_y0": 188.20899999999995, "r_x1": 426.271, "r_y1": 188.20899999999995, "r_x2": 426.271, "r_y2": 182.115, "r_x3": 410.385, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.27, "r_y0": 188.11, "r_x1": 432.497, "r_y1": 188.11, "r_x2": 432.497, "r_y2": 182.115, "r_x3": 426.27, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.496, "r_y0": 188.20899999999995, "r_x1": 448.382, "r_y1": 188.20899999999995, "r_x2": 448.382, "r_y2": 182.115, "r_x3": 432.496, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.381, "r_y0": 188.11, "r_x1": 454.608, "r_y1": 188.11, "r_x2": 454.608, "r_y2": 182.115, "r_x3": 448.381, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.608, "r_y0": 188.20899999999995, "r_x1": 472.75, "r_y1": 188.20899999999995, "r_x2": 472.75, "r_y2": 182.115, "r_x3": 454.608, "r_y3": 182.115, "coord_origin": "TOPLEFT"}, "text": "0422]", "orig": "0422]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.246, "r_y0": 192.42600000000004, "r_x1": 476.013, "r_y1": 192.42600000000004, "r_x2": 476.013, "r_y2": 183.62900000000002, "r_x3": 473.246, "r_y3": 183.62900000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.606, "r_y0": 200.164, "r_x1": 316.748, "r_y1": 200.164, "r_x2": 316.748, "r_y2": 194.07000000000005, "r_x3": 298.606, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.746, "r_y0": 200.06500000000005, "r_x1": 322.973, "r_y1": 200.06500000000005, "r_x2": 322.973, "r_y2": 194.07000000000005, "r_x3": 316.746, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.973, "r_y0": 200.164, "r_x1": 338.859, "r_y1": 200.164, "r_x2": 338.859, "r_y2": 194.07000000000005, "r_x3": 322.973, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.858, "r_y0": 200.06500000000005, "r_x1": 345.085, "r_y1": 200.06500000000005, "r_x2": 345.085, "r_y2": 194.07000000000005, "r_x3": 338.858, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.085, "r_y0": 200.164, "r_x1": 360.971, "r_y1": 200.164, "r_x2": 360.971, "r_y2": 194.07000000000005, "r_x3": 345.085, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.97, "r_y0": 200.06500000000005, "r_x1": 367.197, "r_y1": 200.06500000000005, "r_x2": 367.197, "r_y2": 194.07000000000005, "r_x3": 360.97, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.196, "r_y0": 200.164, "r_x1": 385.338, "r_y1": 200.164, "r_x2": 385.338, "r_y2": 194.07000000000005, "r_x3": 367.196, "r_y3": 194.07000000000005, "coord_origin": "TOPLEFT"}, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 229.521, "t": 195.58399999999995, "r": 298.609, "b": 204.38099999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.5015263557434082, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.521, "r_y0": 204.38099999999997, "r_x1": 298.609, "r_y1": 204.38099999999997, "r_x2": 298.609, "r_y2": 195.58399999999995, "r_x3": 229.521, "r_y3": 195.58399999999995, "coord_origin": "TOPLEFT"}, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "text", "bbox": {"l": 279.105, "t": 214.92600000000004, "r": 336.251, "b": 226.21500000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.6310867667198181, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 279.105, "r_y0": 226.21500000000003, "r_x1": 336.251, "r_y1": 226.21500000000003, "r_x2": 336.251, "r_y2": 214.92600000000004, "r_x3": 279.105, "r_y3": 214.92600000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "text", "bbox": {"l": 222.966, "t": 228.80899999999997, "r": 392.39, "b": 236.27800000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.6924149990081787, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.966, "r_y0": 236.27800000000002, "r_x1": 392.39, "r_y1": 236.27800000000002, "r_x2": 392.39, "r_y2": 228.80899999999997, "r_x3": 222.966, "r_y3": 228.80899999999997, "coord_origin": "TOPLEFT"}, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null}, {"label": "text", "id": 1, "page_no": 0, "cluster": {"id": 1, "label": "text", "bbox": {"l": 163.111, "t": 268.086, "r": 452.249, "b": 465.676, "coord_origin": "TOPLEFT"}, "confidence": 0.9807654023170471, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 278.227, "r_x1": 206.636, "r_y1": 278.227, "r_x2": 206.636, "r_y2": 270.30100000000004, "r_x3": 163.111, "r_y3": 270.30100000000004, "coord_origin": "TOPLEFT"}, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.617, "r_y0": 279.375, "r_x1": 452.245, "r_y1": 279.375, "r_x2": 452.245, "r_y2": 268.086, "r_x3": 211.617, "r_y3": 268.086, "coord_origin": "TOPLEFT"}, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 290.334, "r_x1": 452.242, "r_y1": 290.334, "r_x2": 452.242, "r_y2": 279.04499999999996, "r_x3": 163.111, "r_y3": 279.04499999999996, "coord_origin": "TOPLEFT"}, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 301.293, "r_x1": 452.248, "r_y1": 301.293, "r_x2": 452.248, "r_y2": 290.004, "r_x3": 163.111, "r_y3": 290.004, "coord_origin": "TOPLEFT"}, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 312.252, "r_x1": 452.241, "r_y1": 312.252, "r_x2": 452.241, "r_y2": 300.963, "r_x3": 163.111, "r_y3": 300.963, "coord_origin": "TOPLEFT"}, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 323.21, "r_x1": 452.246, "r_y1": 323.21, "r_x2": 452.246, "r_y2": 311.921, "r_x3": 163.111, "r_y3": 311.921, "coord_origin": "TOPLEFT"}, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 334.169, "r_x1": 452.246, "r_y1": 334.169, "r_x2": 452.246, "r_y2": 322.88, "r_x3": 163.111, "r_y3": 322.88, "coord_origin": "TOPLEFT"}, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 345.128, "r_x1": 452.247, "r_y1": 345.128, "r_x2": 452.247, "r_y2": 333.839, "r_x3": 163.111, "r_y3": 333.839, "coord_origin": "TOPLEFT"}, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 356.087, "r_x1": 452.246, "r_y1": 356.087, "r_x2": 452.246, "r_y2": 344.798, "r_x3": 163.111, "r_y3": 344.798, "coord_origin": "TOPLEFT"}, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 367.046, "r_x1": 452.248, "r_y1": 367.046, "r_x2": 452.248, "r_y2": 355.757, "r_x3": 163.111, "r_y3": 355.757, "coord_origin": "TOPLEFT"}, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 378.005, "r_x1": 452.246, "r_y1": 378.005, "r_x2": 452.246, "r_y2": 366.716, "r_x3": 163.111, "r_y3": 366.716, "coord_origin": "TOPLEFT"}, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 388.964, "r_x1": 452.242, "r_y1": 388.964, "r_x2": 452.242, "r_y2": 377.675, "r_x3": 163.111, "r_y3": 377.675, "coord_origin": "TOPLEFT"}, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 399.923, "r_x1": 169.253, "r_y1": 399.923, "r_x2": 169.253, "r_y2": 388.634, "r_x3": 163.111, "r_y3": 388.634, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.795, "r_y0": 399.923, "r_x1": 452.244, "r_y1": 399.923, "r_x2": 452.244, "r_y2": 388.634, "r_x3": 172.795, "r_y3": 388.634, "coord_origin": "TOPLEFT"}, "text": "reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 410.882, "r_x1": 452.249, "r_y1": 410.882, "r_x2": 452.249, "r_y2": 399.593, "r_x3": 163.111, "r_y3": 399.593, "coord_origin": "TOPLEFT"}, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 421.841, "r_x1": 198.194, "r_y1": 421.841, "r_x2": 198.194, "r_y2": 410.552, "r_x3": 163.111, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "accuracy", "orig": "accuracy", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.632, "r_y0": 421.841, "r_x1": 292.676, "r_y1": 421.841, "r_x2": 292.676, "r_y2": 410.552, "r_x3": 202.632, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "improves significantly,", "orig": "improves significantly,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.115, "r_y0": 421.841, "r_x1": 332.719, "r_y1": 421.841, "r_x2": 332.719, "r_y2": 410.552, "r_x3": 297.115, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "inference", "orig": "inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.158, "r_y0": 421.841, "r_x1": 365.708, "r_y1": 421.841, "r_x2": 365.708, "r_y2": 410.552, "r_x3": 337.158, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "time is", "orig": "time is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.146, "r_y0": 421.841, "r_x1": 396.249, "r_y1": 421.841, "r_x2": 396.249, "r_y2": 410.552, "r_x3": 370.146, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "halved", "orig": "halved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.696, "r_y0": 421.841, "r_x1": 452.241, "r_y1": 421.841, "r_x2": 452.241, "r_y2": 410.552, "r_x3": 400.696, "r_y3": 410.552, "coord_origin": "TOPLEFT"}, "text": "compared to", "orig": "compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 432.799, "r_x1": 452.242, "r_y1": 432.799, "r_x2": 452.242, "r_y2": 421.51, "r_x3": 163.111, "r_y3": 421.51, "coord_origin": "TOPLEFT"}, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 443.758, "r_x1": 200.22, "r_y1": 443.758, "r_x2": 200.22, "r_y2": 432.469, "r_x3": 163.111, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "tactically", "orig": "tactically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 204.282, "r_y0": 443.758, "r_x1": 234.527, "r_y1": 443.758, "r_x2": 234.527, "r_y2": 432.469, "r_x3": 204.282, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "correct.", "orig": "correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 238.588, "r_y0": 443.758, "r_x1": 452.244, "r_y1": 443.758, "r_x2": 452.244, "r_y2": 432.469, "r_x3": 238.588, "r_y3": 432.469, "coord_origin": "TOPLEFT"}, "text": "This in turn eliminates most post-processing needs.", "orig": "This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 454.717, "r_x1": 452.246, "r_y1": 454.717, "r_x2": 452.246, "r_y2": 443.428, "r_x3": 163.111, "r_y3": 443.428, "coord_origin": "TOPLEFT"}, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 465.676, "r_x1": 225.561, "r_y1": 465.676, "r_x2": 225.561, "r_y2": 454.387, "r_x3": 163.111, "r_y3": 454.387, "coord_origin": "TOPLEFT"}, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Abstract. Extracting tables from documents is a crucial task in any document conversion pipeline. Recently, transformer-based models have demonstrated that table-structure can be recognized with impressive accuracy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking only the image of a table, such models predict a sequence of tokens (e.g. in HTML, LaTeX) which represent the structure of the table. Since the token representation of the table structure has a significant impact on the accuracy and run-time performance of any Im2Seq model, we investigate in this paper how table-structure representation can be optimised. We propose a new, optimised table-structure language (OTSL) with a minimized vocabulary and specific rules. The benefits of OTSL are that it reduces the number of tokens to 5 (HTML needs 28+) and shortens the sequence length to half of HTML on average. Consequently, model accuracy improves significantly, inference time is halved compared to HTML-based models, and the predicted table structures are always syntactically correct. This in turn eliminates most post-processing needs. Popular table structure data-sets will be published in OTSL format to the community."}, {"label": "text", "id": 4, "page_no": 0, "cluster": {"id": 4, "label": "text", "bbox": {"l": 163.111, "t": 476.479, "r": 452.241, "b": 498.727, "coord_origin": "TOPLEFT"}, "confidence": 0.9304055571556091, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 486.62, "r_x1": 211.942, "r_y1": 486.62, "r_x2": 211.942, "r_y2": 478.694, "r_x3": 163.111, "r_y3": 478.694, "coord_origin": "TOPLEFT"}, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.552, "r_y0": 487.768, "r_x1": 452.241, "r_y1": 487.768, "r_x2": 452.241, "r_y2": 476.479, "r_x3": 216.552, "r_y3": 476.479, "coord_origin": "TOPLEFT"}, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.111, "r_y0": 498.727, "r_x1": 257.642, "r_y1": 498.727, "r_x2": 257.642, "r_y2": 487.438, "r_x3": 163.111, "r_y3": 487.438, "coord_origin": "TOPLEFT"}, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Keywords: Table Structure Recognition \u00b7 Data Representation \u00b7 Transformers \u00b7 Optimization."}, {"label": "section_header", "id": 3, "page_no": 0, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 522.12, "r": 228.934, "b": 532.688, "coord_origin": "TOPLEFT"}, "confidence": 0.9392016530036926, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 532.688, "r_x1": 141.489, "r_y1": 532.688, "r_x2": 141.489, "r_y2": 522.12, "r_x3": 134.765, "r_y3": 522.12, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 532.688, "r_x1": 228.934, "r_y1": 532.688, "r_x2": 228.934, "r_y2": 522.12, "r_x3": 154.938, "r_y3": 522.12, "coord_origin": "TOPLEFT"}, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1 Introduction"}, {"label": "text", "id": 0, "page_no": 0, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 548.287, "r": 480.596, "b": 628.815, "coord_origin": "TOPLEFT"}, "confidence": 0.9835679531097412, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.0840000000001, "r_x1": 480.594, "r_y1": 557.0840000000001, "r_x2": 480.594, "r_y2": 548.287, "r_x3": 134.765, "r_y3": 548.287, "coord_origin": "TOPLEFT"}, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.04, "r_x1": 480.592, "r_y1": 569.04, "r_x2": 480.592, "r_y2": 560.2429999999999, "r_x3": 134.765, "r_y3": 560.2429999999999, "coord_origin": "TOPLEFT"}, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 580.995, "r_x1": 170.451, "r_y1": 580.995, "r_x2": 170.451, "r_y2": 572.198, "r_x3": 134.765, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "valuable", "orig": "valuable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.173, "r_y0": 580.995, "r_x1": 225.832, "r_y1": 580.995, "r_x2": 225.832, "r_y2": 572.198, "r_x3": 175.173, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "information", "orig": "information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.544, "r_y0": 580.995, "r_x1": 289.826, "r_y1": 580.995, "r_x2": 289.826, "r_y2": 572.198, "r_x3": 230.544, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "and therefore", "orig": "and therefore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 294.538, "r_y0": 580.995, "r_x1": 388.395, "r_y1": 580.995, "r_x2": 388.395, "r_y2": 572.198, "r_x3": 294.538, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "need to be extracted", "orig": "need to be extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.107, "r_y0": 580.995, "r_x1": 480.593, "r_y1": 580.995, "r_x2": 480.593, "r_y2": 572.198, "r_x3": 393.107, "r_y3": 572.198, "coord_origin": "TOPLEFT"}, "text": "with high accuracy.", "orig": "with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 592.95, "r_x1": 480.596, "r_y1": 592.95, "r_x2": 480.596, "r_y2": 584.153, "r_x3": 134.765, "r_y3": 584.153, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 604.905, "r_x1": 155.266, "r_y1": 604.905, "r_x2": 155.266, "r_y2": 596.108, "r_x3": 134.765, "r_y3": 596.108, "coord_origin": "TOPLEFT"}, "text": "ture,", "orig": "ture,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.48, "r_y0": 604.905, "r_x1": 480.587, "r_y1": 604.905, "r_x2": 480.587, "r_y2": 596.108, "r_x3": 159.48, "r_y3": 596.108, "coord_origin": "TOPLEFT"}, "text": "making it difficult to recover their correct structure with simple analyt-", "orig": "making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 616.86, "r_x1": 149.705, "r_y1": 616.86, "r_x2": 149.705, "r_y2": 608.063, "r_x3": 134.765, "r_y3": 608.063, "coord_origin": "TOPLEFT"}, "text": "ical", "orig": "ical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.71, "r_y0": 616.86, "r_x1": 480.591, "r_y1": 616.86, "r_x2": 480.591, "r_y2": 608.063, "r_x3": 153.71, "r_y3": 608.063, "coord_origin": "TOPLEFT"}, "text": "methods. Therefore, accurate table extraction is achieved these days with", "orig": "methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.815, "r_x1": 279.327, "r_y1": 628.815, "r_x2": 279.327, "r_y2": 620.018, "r_x3": 134.765, "r_y3": 620.018, "coord_origin": "TOPLEFT"}, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports, manuals, specification sheets or marketing material. They often encode highly valuable information and therefore need to be extracted with high accuracy. Unfortunately, tables appear in documents in various sizes, styling and structure, making it difficult to recover their correct structure with simple analytical methods. Therefore, accurate table extraction is achieved these days with machine-learning based methods."}, {"label": "text", "id": 2, "page_no": 0, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 632.148, "r": 480.596, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9696458578109741, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.708, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 149.708, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.596, "r_y1": 652.9, "r_x2": 480.596, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 480.595, "r_y1": 664.855, "r_x2": 480.595, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In modern document understanding systems [1,15], table extraction is typically a two-step process. Firstly, every table on a page is located with a bounding box, and secondly, their logical row and column structure is recognized. As of"}, {"label": "text", "id": 37, "page_no": 0, "cluster": {"id": 37, "label": "text", "bbox": {"l": 18.34, "t": 165.0, "r": 36.34, "b": 205.0, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 205.0, "r_x1": 36.34, "r_y1": 165.0, "r_x2": 18.34, "r_y2": 165.0, "r_x3": 18.34, "r_y3": 205.0, "coord_origin": "TOPLEFT"}, "text": "2023", "orig": "2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2023"}], "headers": [{"label": "page_header", "id": 6, "page_no": 0, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 18.34, "t": 215.0, "r": 36.34, "b": 555.0, "coord_origin": "TOPLEFT"}, "confidence": 0.8899643421173096, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 555.0, "r_x1": 36.34, "r_y1": 375.0, "r_x2": 18.34, "r_y2": 375.0, "r_x3": 18.34, "r_y3": 555.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2305.03393v1", "orig": "arXiv:2305.03393v1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 355.0, "r_x1": 36.34, "r_y1": 285.0, "r_x2": 18.34, "r_y2": 285.0, "r_x3": 18.34, "r_y3": 355.0, "coord_origin": "TOPLEFT"}, "text": "[cs.CV]", "orig": "[cs.CV]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 265.0, "r_x1": 36.34, "r_y1": 255.0, "r_x2": 18.34, "r_y2": 255.0, "r_x3": 18.34, "r_y3": 265.0, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 245.0, "r_x1": 36.34, "r_y1": 215.0, "r_x2": 18.34, "r_y2": 215.0, "r_x3": 18.34, "r_y3": 245.0, "coord_origin": "TOPLEFT"}, "text": "May", "orig": "May", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "arXiv:2305.03393v1 [cs.CV] 5 May"}]}}, {"page_no": 1, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 134.26, "r_x1": 162.644, "r_y1": 134.26, "r_x2": 162.644, "r_y2": 126.33399999999995, "r_x3": 134.765, "r_y3": 126.33399999999995, "coord_origin": "TOPLEFT"}, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.062, "r_y0": 135.40800000000002, "r_x1": 480.591, "r_y1": 135.40800000000002, "r_x2": 480.591, "r_y2": 124.11900000000003, "r_x3": 167.062, "r_y3": 124.11900000000003, "coord_origin": "TOPLEFT"}, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 146.36699999999996, "r_x1": 190.823, "r_y1": 146.36699999999996, "r_x2": 190.823, "r_y2": 135.07799999999997, "r_x3": 134.765, "r_y3": 135.07799999999997, "coord_origin": "TOPLEFT"}, "text": "table-example", "orig": "table-example", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.199, "r_y0": 146.36699999999996, "r_x1": 480.59, "r_y1": 146.36699999999996, "r_x2": 480.59, "r_y2": 135.07799999999997, "r_x3": 195.199, "r_y3": 135.07799999999997, "coord_origin": "TOPLEFT"}, "text": "with complex row and column headers, including a 2D empty span,", "orig": "with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 157.32600000000002, "r_x1": 480.591, "r_y1": 157.32600000000002, "r_x2": 480.591, "r_y2": 146.03700000000003, "r_x3": 134.765, "r_y3": 146.03700000000003, "coord_origin": "TOPLEFT"}, "text": "(B) minimal graphical representation of table structure using rectangular layout, (C)", "orig": "(B) minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 168.28499999999997, "r_x1": 480.592, "r_y1": 168.28499999999997, "r_x2": 480.592, "r_y2": 156.99599999999998, "r_x3": 134.765, "r_y3": 156.99599999999998, "coord_origin": "TOPLEFT"}, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 179.24400000000003, "r_x1": 480.589, "r_y1": 179.24400000000003, "r_x2": 480.589, "r_y2": 167.95500000000004, "r_x3": 134.765, "r_y3": 167.95500000000004, "coord_origin": "TOPLEFT"}, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 190.20299999999997, "r_x1": 480.59, "r_y1": 190.20299999999997, "r_x2": 480.59, "r_y2": 178.914, "r_x3": 134.765, "r_y3": 178.914, "coord_origin": "TOPLEFT"}, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 201.16200000000003, "r_x1": 460.871, "r_y1": 201.16200000000003, "r_x2": 460.871, "r_y2": 189.87300000000005, "r_x3": 134.765, "r_y3": 189.87300000000005, "coord_origin": "TOPLEFT"}, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.411, "r_y0": 289.478, "r_x1": 446.134, "r_y1": 288.875, "r_x2": 446.134, "r_y2": 280.49, "r_x3": 396.411, "r_y3": 281.093, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.748, "r_y0": 311.731, "r_x1": 463.795, "r_y1": 311.337, "r_x2": 463.795, "r_y2": 302.952, "r_x3": 395.748, "r_y3": 303.346, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.563, "r_y0": 322.9, "r_x1": 463.716, "r_y1": 322.618, "r_x2": 463.716, "r_y2": 314.233, "r_x3": 407.563, "r_y3": 314.515, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.511, "r_y0": 300.579, "r_x1": 463.773, "r_y1": 300.093, "r_x2": 463.773, "r_y2": 291.708, "r_x3": 418.511, "r_y3": 292.194, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.397, "r_y0": 333.784, "r_x1": 463.915, "r_y1": 333.963, "r_x2": 463.915, "r_y2": 325.578, "r_x3": 407.397, "r_y3": 325.399, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.895, "r_y0": 288.651, "r_x1": 463.513, "r_y1": 288.651, "r_x2": 463.513, "r_y2": 280.266, "r_x3": 451.895, "r_y3": 280.266, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.097, "r_y0": 322.989, "r_x1": 402.659, "r_y1": 322.989, "r_x2": 402.659, "r_y2": 314.604, "r_x3": 396.097, "r_y3": 314.604, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.998, "r_y0": 333.883, "r_x1": 402.561, "r_y1": 333.883, "r_x2": 402.561, "r_y2": 325.498, "r_x3": 395.998, "r_y3": 325.498, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.275, "r_y0": 300.765, "r_x1": 414.036, "r_y1": 300.628, "r_x2": 414.036, "r_y2": 292.243, "r_x3": 396.275, "r_y3": 292.38, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.256, "r_y0": 419.675, "r_x1": 452.874, "r_y1": 419.675, "r_x2": 452.874, "r_y2": 411.29, "r_x3": 441.256, "r_y3": 411.29, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 406.873, "r_x1": 432.489, "r_y1": 406.873, "r_x2": 432.489, "r_y2": 399.886, "r_x3": 393.753, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.59, "r_y0": 406.873, "r_x1": 438.801, "r_y1": 406.873, "r_x2": 438.801, "r_y2": 399.886, "r_x3": 434.59, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.906, "r_y0": 406.873, "r_x1": 463.222, "r_y1": 406.873, "r_x2": 463.222, "r_y2": 399.886, "r_x3": 440.906, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.118, "r_y0": 265.626, "r_x1": 413.993, "r_y1": 265.626, "r_x2": 413.993, "r_y2": 258.63800000000003, "r_x3": 384.118, "r_y3": 258.63800000000003, "coord_origin": "TOPLEFT"}, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 273.75300000000004, "r_x1": 451.451, "r_y1": 273.75300000000004, "r_x2": 451.451, "r_y2": 266.76599999999996, "r_x3": 393.753, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.551, "r_y0": 273.75300000000004, "r_x1": 461.975, "r_y1": 273.75300000000004, "r_x2": 461.975, "r_y2": 266.76599999999996, "r_x3": 453.551, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.793, "r_y0": 406.839, "r_x1": 233.894, "r_y1": 406.839, "r_x2": 233.894, "r_y2": 399.851, "r_x3": 151.793, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.993, "r_y0": 406.839, "r_x1": 244.417, "r_y1": 406.839, "r_x2": 244.417, "r_y2": 399.851, "r_x3": 235.993, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.522, "r_y0": 406.839, "r_x1": 268.839, "r_y1": 406.839, "r_x2": 268.839, "r_y2": 399.851, "r_x3": 246.522, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.33, "r_y0": 220.65300000000002, "r_x1": 159.798, "r_y1": 220.65300000000002, "r_x2": 159.798, "r_y2": 213.66600000000005, "r_x3": 154.33, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.071, "r_y0": 220.65300000000002, "r_x1": 326.539, "r_y1": 220.65300000000002, "r_x2": 326.539, "r_y2": 213.66600000000005, "r_x3": 321.071, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 286.675, "r_x1": 175.839, "r_y1": 286.675, "r_x2": 175.839, "r_y2": 280.386, "r_x3": 153.095, "r_y3": 280.386, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 293.491, "r_x1": 172.796, "r_y1": 293.491, "r_x2": 172.796, "r_y2": 287.203, "r_x3": 160.67, "r_y3": 287.203, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 300.308, "r_x1": 351.469, "r_y1": 300.308, "r_x2": 351.469, "r_y2": 294.019, "r_x3": 168.246, "r_y3": 294.019, "coord_origin": "TOPLEFT"}, "text": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "orig": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 307.125, "r_x1": 174.69, "r_y1": 307.125, "r_x2": 174.69, "r_y2": 300.836, "r_x3": 160.67, "r_y3": 300.836, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 313.942, "r_x1": 172.796, "r_y1": 313.942, "r_x2": 172.796, "r_y2": 307.653, "r_x3": 160.67, "r_y3": 307.653, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 320.759, "r_x1": 265.275, "r_y1": 320.759, "r_x2": 265.275, "r_y2": 314.47, "r_x3": 168.246, "r_y3": 314.47, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 327.575, "r_x1": 174.69, "r_y1": 327.575, "r_x2": 174.69, "r_y2": 321.287, "r_x3": 160.67, "r_y3": 321.287, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 334.392, "r_x1": 172.796, "r_y1": 334.392, "r_x2": 172.796, "r_y2": 328.103, "r_x3": 160.67, "r_y3": 328.103, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 341.209, "r_x1": 373.091, "r_y1": 341.209, "r_x2": 373.091, "r_y2": 334.92, "r_x3": 168.246, "r_y3": 334.92, "coord_origin": "TOPLEFT"}, "text": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 348.026, "r_x1": 174.69, "r_y1": 348.026, "r_x2": 174.69, "r_y2": 341.737, "r_x3": 160.67, "r_y3": 341.737, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 354.842, "r_x1": 172.796, "r_y1": 354.842, "r_x2": 172.796, "r_y2": 348.553, "r_x3": 160.67, "r_y3": 348.553, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 361.659, "r_x1": 298.249, "r_y1": 361.659, "r_x2": 298.249, "r_y2": 355.37, "r_x3": 168.246, "r_y3": 355.37, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 368.476, "r_x1": 174.69, "r_y1": 368.476, "r_x2": 174.69, "r_y2": 362.187, "r_x3": 160.67, "r_y3": 362.187, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 375.292, "r_x1": 172.796, "r_y1": 375.292, "r_x2": 172.796, "r_y2": 369.004, "r_x3": 160.67, "r_y3": 369.004, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 382.109, "r_x1": 298.249, "r_y1": 382.109, "r_x2": 298.249, "r_y2": 375.821, "r_x3": 168.246, "r_y3": 375.821, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 388.926, "r_x1": 174.69, "r_y1": 388.926, "r_x2": 174.69, "r_y2": 382.637, "r_x3": 160.67, "r_y3": 382.637, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 395.743, "r_x1": 177.733, "r_y1": 395.743, "r_x2": 177.733, "r_y2": 389.454, "r_x3": 153.095, "r_y3": 389.454, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.061, "r_y0": 419.828, "r_x1": 412.476, "r_y1": 419.828, "r_x2": 412.476, "r_y2": 411.443, "r_x3": 395.061, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.693, "r_y0": 419.828, "r_x1": 436.571, "r_y1": 419.828, "r_x2": 436.571, "r_y2": 411.443, "r_x3": 418.693, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 416.144, "r_x1": 175.106, "r_y1": 416.144, "r_x2": 175.106, "r_y2": 409.855, "r_x3": 152.362, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.894, "r_y0": 416.144, "r_x1": 191.019, "r_y1": 416.144, "r_x2": 191.019, "r_y2": 409.855, "r_x3": 178.894, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.807, "r_y0": 416.144, "r_x1": 208.826, "r_y1": 416.144, "r_x2": 208.826, "r_y2": 409.855, "r_x3": 194.807, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.614, "r_y0": 416.144, "r_x1": 226.26, "r_y1": 416.144, "r_x2": 226.26, "r_y2": 409.855, "r_x3": 212.614, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.047, "r_y0": 416.144, "r_x1": 245.588, "r_y1": 416.144, "r_x2": 245.588, "r_y2": 409.855, "r_x3": 230.047, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.375, "r_y0": 416.144, "r_x1": 259.039, "r_y1": 416.144, "r_x2": 259.039, "r_y2": 409.855, "r_x3": 249.375, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td", "orig": "<td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.828, "r_y0": 416.144, "r_x1": 298.936, "r_y1": 416.144, "r_x2": 298.936, "r_y2": 409.855, "r_x3": 262.828, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"2\"", "orig": "colspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.724, "r_y0": 416.144, "r_x1": 338.832, "r_y1": 416.144, "r_x2": 338.832, "r_y2": 409.855, "r_x3": 302.724, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"3\"", "orig": "colspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 424.476, "r_x1": 190.741, "r_y1": 424.476, "r_x2": 190.741, "r_y2": 418.187, "r_x3": 152.362, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"2\"", "orig": "rowspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.529, "r_y0": 424.476, "r_x1": 232.908, "r_y1": 424.476, "r_x2": 232.908, "r_y2": 418.187, "r_x3": 194.529, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"3\"", "orig": "rowspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.695, "r_y0": 424.476, "r_x1": 269.101, "r_y1": 424.476, "r_x2": 269.101, "r_y2": 418.187, "r_x3": 236.695, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "> </table>", "orig": "> </table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.506, "r_y0": 265.679, "r_x1": 185.219, "r_y1": 265.679, "r_x2": 185.219, "r_y2": 258.692, "r_x3": 154.506, "r_y3": 258.692, "coord_origin": "TOPLEFT"}, "text": "C HTML", "orig": "C HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.355, "r_y0": 273.57500000000005, "r_x1": 222.054, "r_y1": 273.57500000000005, "r_x2": 222.054, "r_y2": 266.58799999999997, "r_x3": 164.355, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.153, "r_y0": 273.57500000000005, "r_x1": 232.577, "r_y1": 273.57500000000005, "r_x2": 232.577, "r_y2": 266.58799999999997, "r_x3": 224.153, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 461.111, "r_x1": 161.329, "r_y1": 461.111, "r_x2": 161.329, "r_y2": 452.314, "r_x3": 134.765, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.269, "r_y0": 461.111, "r_x1": 226.286, "r_y1": 461.111, "r_x2": 226.286, "r_y2": 452.314, "r_x3": 164.269, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.992, "r_y0": 461.111, "r_x1": 480.592, "r_y1": 461.111, "r_x2": 480.592, "r_y2": 452.314, "r_x3": 229.992, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 473.066, "r_x1": 480.592, "r_y1": 473.066, "r_x2": 480.592, "r_y2": 464.269, "r_x3": 134.765, "r_y3": 464.269, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 485.021, "r_x1": 480.587, "r_y1": 485.021, "r_x2": 480.587, "r_y2": 476.224, "r_x3": 134.765, "r_y3": 476.224, "coord_origin": "TOPLEFT"}, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 496.977, "r_x1": 480.587, "r_y1": 496.977, "r_x2": 480.587, "r_y2": 488.18, "r_x3": 134.765, "r_y3": 488.18, "coord_origin": "TOPLEFT"}, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 508.932, "r_x1": 165.481, "r_y1": 508.932, "r_x2": 165.481, "r_y2": 500.135, "r_x3": 134.765, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "area of", "orig": "area of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.874, "r_y0": 508.932, "r_x1": 207.895, "r_y1": 508.932, "r_x2": 207.895, "r_y2": 500.135, "r_x3": 169.874, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "research,", "orig": "research,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.289, "r_y0": 508.932, "r_x1": 220.589, "r_y1": 508.932, "r_x2": 220.589, "r_y2": 500.135, "r_x3": 212.289, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.992, "r_y0": 508.932, "r_x1": 480.59, "r_y1": 508.932, "r_x2": 480.59, "r_y2": 500.135, "r_x3": 224.992, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "which many novel machine learning algorithms are being", "orig": "which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 520.887, "r_x1": 313.246, "r_y1": 520.887, "r_x2": 313.246, "r_y2": 512.0899999999999, "r_x3": 134.765, "r_y3": 512.0899999999999, "coord_origin": "TOPLEFT"}, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 533.348, "r_x1": 187.471, "r_y1": 533.348, "r_x2": 187.471, "r_y2": 524.5509999999999, "r_x3": 149.709, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "Recently", "orig": "Recently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.194, "r_y0": 533.348, "r_x1": 480.589, "r_y1": 533.348, "r_x2": 480.589, "r_y2": 524.5509999999999, "r_x3": 192.194, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "emerging SOTA methods for table structure recognition employ", "orig": "emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 480.592, "r_y1": 545.304, "r_x2": 480.592, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.589, "r_y1": 557.259, "r_x2": 480.589, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 480.588, "r_y1": 569.2139999999999, "r_x2": 480.588, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 480.59, "r_y1": 581.169, "r_x2": 480.59, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.595, "r_y1": 593.124, "r_x2": 480.595, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.587, "r_y1": 605.08, "r_x2": 480.587, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.595, "r_y1": 617.035, "r_x2": 480.595, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.594, "r_y1": 628.99, "r_x2": 480.594, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.595, "r_y1": 640.9449999999999, "r_x2": 480.595, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.588, "r_y1": 652.9, "r_x2": 480.588, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 421.454, "r_y1": 664.855, "r_x2": 421.454, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 5, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8580349683761597, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9076642990112305, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "caption", "bbox": {"l": 134.765, "t": 124.11900000000003, "r": 480.592, "b": 201.16200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.8939083218574524, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 134.26, "r_x1": 162.644, "r_y1": 134.26, "r_x2": 162.644, "r_y2": 126.33399999999995, "r_x3": 134.765, "r_y3": 126.33399999999995, "coord_origin": "TOPLEFT"}, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.062, "r_y0": 135.40800000000002, "r_x1": 480.591, "r_y1": 135.40800000000002, "r_x2": 480.591, "r_y2": 124.11900000000003, "r_x3": 167.062, "r_y3": 124.11900000000003, "coord_origin": "TOPLEFT"}, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 146.36699999999996, "r_x1": 190.823, "r_y1": 146.36699999999996, "r_x2": 190.823, "r_y2": 135.07799999999997, "r_x3": 134.765, "r_y3": 135.07799999999997, "coord_origin": "TOPLEFT"}, "text": "table-example", "orig": "table-example", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.199, "r_y0": 146.36699999999996, "r_x1": 480.59, "r_y1": 146.36699999999996, "r_x2": 480.59, "r_y2": 135.07799999999997, "r_x3": 195.199, "r_y3": 135.07799999999997, "coord_origin": "TOPLEFT"}, "text": "with complex row and column headers, including a 2D empty span,", "orig": "with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 157.32600000000002, "r_x1": 480.591, "r_y1": 157.32600000000002, "r_x2": 480.591, "r_y2": 146.03700000000003, "r_x3": 134.765, "r_y3": 146.03700000000003, "coord_origin": "TOPLEFT"}, "text": "(B) minimal graphical representation of table structure using rectangular layout, (C)", "orig": "(B) minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 168.28499999999997, "r_x1": 480.592, "r_y1": 168.28499999999997, "r_x2": 480.592, "r_y2": 156.99599999999998, "r_x3": 134.765, "r_y3": 156.99599999999998, "coord_origin": "TOPLEFT"}, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 179.24400000000003, "r_x1": 480.589, "r_y1": 179.24400000000003, "r_x2": 480.589, "r_y2": 167.95500000000004, "r_x3": 134.765, "r_y3": 167.95500000000004, "coord_origin": "TOPLEFT"}, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 190.20299999999997, "r_x1": 480.59, "r_y1": 190.20299999999997, "r_x2": 480.59, "r_y2": 178.914, "r_x3": 134.765, "r_y3": 178.914, "coord_origin": "TOPLEFT"}, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 201.16200000000003, "r_x1": 460.871, "r_y1": 201.16200000000003, "r_x2": 460.871, "r_y2": 189.87300000000005, "r_x3": 134.765, "r_y3": 189.87300000000005, "coord_origin": "TOPLEFT"}, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "picture", "bbox": {"l": 148.45364379882812, "t": 208.37423706054688, "r": 464.3608093261719, "b": 425.8462219238281, "coord_origin": "TOPLEFT"}, "confidence": 0.9688959121704102, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.411, "r_y0": 289.478, "r_x1": 446.134, "r_y1": 288.875, "r_x2": 446.134, "r_y2": 280.49, "r_x3": 396.411, "r_y3": 281.093, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.748, "r_y0": 311.731, "r_x1": 463.795, "r_y1": 311.337, "r_x2": 463.795, "r_y2": 302.952, "r_x3": 395.748, "r_y3": 303.346, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.563, "r_y0": 322.9, "r_x1": 463.716, "r_y1": 322.618, "r_x2": 463.716, "r_y2": 314.233, "r_x3": 407.563, "r_y3": 314.515, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.511, "r_y0": 300.579, "r_x1": 463.773, "r_y1": 300.093, "r_x2": 463.773, "r_y2": 291.708, "r_x3": 418.511, "r_y3": 292.194, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.397, "r_y0": 333.784, "r_x1": 463.915, "r_y1": 333.963, "r_x2": 463.915, "r_y2": 325.578, "r_x3": 407.397, "r_y3": 325.399, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.895, "r_y0": 288.651, "r_x1": 463.513, "r_y1": 288.651, "r_x2": 463.513, "r_y2": 280.266, "r_x3": 451.895, "r_y3": 280.266, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.097, "r_y0": 322.989, "r_x1": 402.659, "r_y1": 322.989, "r_x2": 402.659, "r_y2": 314.604, "r_x3": 396.097, "r_y3": 314.604, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.998, "r_y0": 333.883, "r_x1": 402.561, "r_y1": 333.883, "r_x2": 402.561, "r_y2": 325.498, "r_x3": 395.998, "r_y3": 325.498, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.275, "r_y0": 300.765, "r_x1": 414.036, "r_y1": 300.628, "r_x2": 414.036, "r_y2": 292.243, "r_x3": 396.275, "r_y3": 292.38, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.256, "r_y0": 419.675, "r_x1": 452.874, "r_y1": 419.675, "r_x2": 452.874, "r_y2": 411.29, "r_x3": 441.256, "r_y3": 411.29, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 406.873, "r_x1": 432.489, "r_y1": 406.873, "r_x2": 432.489, "r_y2": 399.886, "r_x3": 393.753, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.59, "r_y0": 406.873, "r_x1": 438.801, "r_y1": 406.873, "r_x2": 438.801, "r_y2": 399.886, "r_x3": 434.59, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.906, "r_y0": 406.873, "r_x1": 463.222, "r_y1": 406.873, "r_x2": 463.222, "r_y2": 399.886, "r_x3": 440.906, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.118, "r_y0": 265.626, "r_x1": 413.993, "r_y1": 265.626, "r_x2": 413.993, "r_y2": 258.63800000000003, "r_x3": 384.118, "r_y3": 258.63800000000003, "coord_origin": "TOPLEFT"}, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 273.75300000000004, "r_x1": 451.451, "r_y1": 273.75300000000004, "r_x2": 451.451, "r_y2": 266.76599999999996, "r_x3": 393.753, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.551, "r_y0": 273.75300000000004, "r_x1": 461.975, "r_y1": 273.75300000000004, "r_x2": 461.975, "r_y2": 266.76599999999996, "r_x3": 453.551, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.793, "r_y0": 406.839, "r_x1": 233.894, "r_y1": 406.839, "r_x2": 233.894, "r_y2": 399.851, "r_x3": 151.793, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.993, "r_y0": 406.839, "r_x1": 244.417, "r_y1": 406.839, "r_x2": 244.417, "r_y2": 399.851, "r_x3": 235.993, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.522, "r_y0": 406.839, "r_x1": 268.839, "r_y1": 406.839, "r_x2": 268.839, "r_y2": 399.851, "r_x3": 246.522, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.33, "r_y0": 220.65300000000002, "r_x1": 159.798, "r_y1": 220.65300000000002, "r_x2": 159.798, "r_y2": 213.66600000000005, "r_x3": 154.33, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.071, "r_y0": 220.65300000000002, "r_x1": 326.539, "r_y1": 220.65300000000002, "r_x2": 326.539, "r_y2": 213.66600000000005, "r_x3": 321.071, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 286.675, "r_x1": 175.839, "r_y1": 286.675, "r_x2": 175.839, "r_y2": 280.386, "r_x3": 153.095, "r_y3": 280.386, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 293.491, "r_x1": 172.796, "r_y1": 293.491, "r_x2": 172.796, "r_y2": 287.203, "r_x3": 160.67, "r_y3": 287.203, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 300.308, "r_x1": 351.469, "r_y1": 300.308, "r_x2": 351.469, "r_y2": 294.019, "r_x3": 168.246, "r_y3": 294.019, "coord_origin": "TOPLEFT"}, "text": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "orig": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 307.125, "r_x1": 174.69, "r_y1": 307.125, "r_x2": 174.69, "r_y2": 300.836, "r_x3": 160.67, "r_y3": 300.836, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 313.942, "r_x1": 172.796, "r_y1": 313.942, "r_x2": 172.796, "r_y2": 307.653, "r_x3": 160.67, "r_y3": 307.653, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 320.759, "r_x1": 265.275, "r_y1": 320.759, "r_x2": 265.275, "r_y2": 314.47, "r_x3": 168.246, "r_y3": 314.47, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 327.575, "r_x1": 174.69, "r_y1": 327.575, "r_x2": 174.69, "r_y2": 321.287, "r_x3": 160.67, "r_y3": 321.287, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 334.392, "r_x1": 172.796, "r_y1": 334.392, "r_x2": 172.796, "r_y2": 328.103, "r_x3": 160.67, "r_y3": 328.103, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 341.209, "r_x1": 373.091, "r_y1": 341.209, "r_x2": 373.091, "r_y2": 334.92, "r_x3": 168.246, "r_y3": 334.92, "coord_origin": "TOPLEFT"}, "text": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 348.026, "r_x1": 174.69, "r_y1": 348.026, "r_x2": 174.69, "r_y2": 341.737, "r_x3": 160.67, "r_y3": 341.737, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 354.842, "r_x1": 172.796, "r_y1": 354.842, "r_x2": 172.796, "r_y2": 348.553, "r_x3": 160.67, "r_y3": 348.553, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 361.659, "r_x1": 298.249, "r_y1": 361.659, "r_x2": 298.249, "r_y2": 355.37, "r_x3": 168.246, "r_y3": 355.37, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 368.476, "r_x1": 174.69, "r_y1": 368.476, "r_x2": 174.69, "r_y2": 362.187, "r_x3": 160.67, "r_y3": 362.187, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 375.292, "r_x1": 172.796, "r_y1": 375.292, "r_x2": 172.796, "r_y2": 369.004, "r_x3": 160.67, "r_y3": 369.004, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 382.109, "r_x1": 298.249, "r_y1": 382.109, "r_x2": 298.249, "r_y2": 375.821, "r_x3": 168.246, "r_y3": 375.821, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 388.926, "r_x1": 174.69, "r_y1": 388.926, "r_x2": 174.69, "r_y2": 382.637, "r_x3": 160.67, "r_y3": 382.637, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 395.743, "r_x1": 177.733, "r_y1": 395.743, "r_x2": 177.733, "r_y2": 389.454, "r_x3": 153.095, "r_y3": 389.454, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.061, "r_y0": 419.828, "r_x1": 412.476, "r_y1": 419.828, "r_x2": 412.476, "r_y2": 411.443, "r_x3": 395.061, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.693, "r_y0": 419.828, "r_x1": 436.571, "r_y1": 419.828, "r_x2": 436.571, "r_y2": 411.443, "r_x3": 418.693, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 416.144, "r_x1": 175.106, "r_y1": 416.144, "r_x2": 175.106, "r_y2": 409.855, "r_x3": 152.362, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.894, "r_y0": 416.144, "r_x1": 191.019, "r_y1": 416.144, "r_x2": 191.019, "r_y2": 409.855, "r_x3": 178.894, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.807, "r_y0": 416.144, "r_x1": 208.826, "r_y1": 416.144, "r_x2": 208.826, "r_y2": 409.855, "r_x3": 194.807, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.614, "r_y0": 416.144, "r_x1": 226.26, "r_y1": 416.144, "r_x2": 226.26, "r_y2": 409.855, "r_x3": 212.614, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.047, "r_y0": 416.144, "r_x1": 245.588, "r_y1": 416.144, "r_x2": 245.588, "r_y2": 409.855, "r_x3": 230.047, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.375, "r_y0": 416.144, "r_x1": 259.039, "r_y1": 416.144, "r_x2": 259.039, "r_y2": 409.855, "r_x3": 249.375, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td", "orig": "<td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.828, "r_y0": 416.144, "r_x1": 298.936, "r_y1": 416.144, "r_x2": 298.936, "r_y2": 409.855, "r_x3": 262.828, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"2\"", "orig": "colspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.724, "r_y0": 416.144, "r_x1": 338.832, "r_y1": 416.144, "r_x2": 338.832, "r_y2": 409.855, "r_x3": 302.724, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"3\"", "orig": "colspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 424.476, "r_x1": 190.741, "r_y1": 424.476, "r_x2": 190.741, "r_y2": 418.187, "r_x3": 152.362, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"2\"", "orig": "rowspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.529, "r_y0": 424.476, "r_x1": 232.908, "r_y1": 424.476, "r_x2": 232.908, "r_y2": 418.187, "r_x3": 194.529, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"3\"", "orig": "rowspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.695, "r_y0": 424.476, "r_x1": 269.101, "r_y1": 424.476, "r_x2": 269.101, "r_y2": 418.187, "r_x3": 236.695, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "> </table>", "orig": "> </table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.506, "r_y0": 265.679, "r_x1": 185.219, "r_y1": 265.679, "r_x2": 185.219, "r_y2": 258.692, "r_x3": 154.506, "r_y3": 258.692, "coord_origin": "TOPLEFT"}, "text": "C HTML", "orig": "C HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.355, "r_y0": 273.57500000000005, "r_x1": 222.054, "r_y1": 273.57500000000005, "r_x2": 222.054, "r_y2": 266.58799999999997, "r_x3": 164.355, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.153, "r_y0": 273.57500000000005, "r_x1": 232.577, "r_y1": 273.57500000000005, "r_x2": 232.577, "r_y2": 266.58799999999997, "r_x3": 224.153, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 396.411, "t": 280.49, "r": 446.134, "b": 289.478, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.411, "r_y0": 289.478, "r_x1": 446.134, "r_y1": 288.875, "r_x2": 446.134, "r_y2": 280.49, "r_x3": 396.411, "r_y3": 281.093, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 395.748, "t": 302.952, "r": 463.795, "b": 311.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.748, "r_y0": 311.731, "r_x1": 463.795, "r_y1": 311.337, "r_x2": 463.795, "r_y2": 302.952, "r_x3": 395.748, "r_y3": 303.346, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 407.563, "t": 314.233, "r": 463.716, "b": 322.9, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.563, "r_y0": 322.9, "r_x1": 463.716, "r_y1": 322.618, "r_x2": 463.716, "r_y2": 314.233, "r_x3": 407.563, "r_y3": 314.515, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 418.511, "t": 291.708, "r": 463.773, "b": 300.579, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.511, "r_y0": 300.579, "r_x1": 463.773, "r_y1": 300.093, "r_x2": 463.773, "r_y2": 291.708, "r_x3": 418.511, "r_y3": 292.194, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 407.397, "t": 325.399, "r": 463.915, "b": 333.963, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.397, "r_y0": 333.784, "r_x1": 463.915, "r_y1": 333.963, "r_x2": 463.915, "r_y2": 325.578, "r_x3": 407.397, "r_y3": 325.399, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 451.895, "t": 280.266, "r": 463.513, "b": 288.651, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.895, "r_y0": 288.651, "r_x1": 463.513, "r_y1": 288.651, "r_x2": 463.513, "r_y2": 280.266, "r_x3": 451.895, "r_y3": 280.266, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 396.097, "t": 314.604, "r": 402.659, "b": 322.989, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.097, "r_y0": 322.989, "r_x1": 402.659, "r_y1": 322.989, "r_x2": 402.659, "r_y2": 314.604, "r_x3": 396.097, "r_y3": 314.604, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 395.998, "t": 325.498, "r": 402.561, "b": 333.883, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.998, "r_y0": 333.883, "r_x1": 402.561, "r_y1": 333.883, "r_x2": 402.561, "r_y2": 325.498, "r_x3": 395.998, "r_y3": 325.498, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 396.275, "t": 292.243, "r": 414.036, "b": 300.765, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.275, "r_y0": 300.765, "r_x1": 414.036, "r_y1": 300.628, "r_x2": 414.036, "r_y2": 292.243, "r_x3": 396.275, "r_y3": 292.38, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 441.256, "t": 411.29, "r": 452.874, "b": 419.675, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.256, "r_y0": 419.675, "r_x1": 452.874, "r_y1": 419.675, "r_x2": 452.874, "r_y2": 411.29, "r_x3": 441.256, "r_y3": 411.29, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 393.753, "t": 399.886, "r": 432.489, "b": 406.873, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 406.873, "r_x1": 432.489, "r_y1": 406.873, "r_x2": 432.489, "r_y2": 399.886, "r_x3": 393.753, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 434.59, "t": 399.886, "r": 438.801, "b": 406.873, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.59, "r_y0": 406.873, "r_x1": 438.801, "r_y1": 406.873, "r_x2": 438.801, "r_y2": 399.886, "r_x3": 434.59, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 440.906, "t": 399.886, "r": 463.222, "b": 406.873, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.906, "r_y0": 406.873, "r_x1": 463.222, "r_y1": 406.873, "r_x2": 463.222, "r_y2": 399.886, "r_x3": 440.906, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 384.118, "t": 258.63800000000003, "r": 413.993, "b": 265.626, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.118, "r_y0": 265.626, "r_x1": 413.993, "r_y1": 265.626, "r_x2": 413.993, "r_y2": 258.63800000000003, "r_x3": 384.118, "r_y3": 258.63800000000003, "coord_origin": "TOPLEFT"}, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 393.753, "t": 266.76599999999996, "r": 451.451, "b": 273.75300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 273.75300000000004, "r_x1": 451.451, "r_y1": 273.75300000000004, "r_x2": 451.451, "r_y2": 266.76599999999996, "r_x3": 393.753, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 453.551, "t": 266.76599999999996, "r": 461.975, "b": 273.75300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.551, "r_y0": 273.75300000000004, "r_x1": 461.975, "r_y1": 273.75300000000004, "r_x2": 461.975, "r_y2": 266.76599999999996, "r_x3": 453.551, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 151.793, "t": 399.851, "r": 233.894, "b": 406.839, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.793, "r_y0": 406.839, "r_x1": 233.894, "r_y1": 406.839, "r_x2": 233.894, "r_y2": 399.851, "r_x3": 151.793, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 235.993, "t": 399.851, "r": 244.417, "b": 406.839, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.993, "r_y0": 406.839, "r_x1": 244.417, "r_y1": 406.839, "r_x2": 244.417, "r_y2": 399.851, "r_x3": 235.993, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 246.522, "t": 399.851, "r": 268.839, "b": 406.839, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.522, "r_y0": 406.839, "r_x1": 268.839, "r_y1": 406.839, "r_x2": 268.839, "r_y2": 399.851, "r_x3": 246.522, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 154.33, "t": 213.66600000000005, "r": 159.798, "b": 220.65300000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.33, "r_y0": 220.65300000000002, "r_x1": 159.798, "r_y1": 220.65300000000002, "r_x2": 159.798, "r_y2": 213.66600000000005, "r_x3": 154.33, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 321.071, "t": 213.66600000000005, "r": 326.539, "b": 220.65300000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.071, "r_y0": 220.65300000000002, "r_x1": 326.539, "r_y1": 220.65300000000002, "r_x2": 326.539, "r_y2": 213.66600000000005, "r_x3": 321.071, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 153.095, "t": 280.386, "r": 175.839, "b": 286.675, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 286.675, "r_x1": 175.839, "r_y1": 286.675, "r_x2": 175.839, "r_y2": 280.386, "r_x3": 153.095, "r_y3": 280.386, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 160.67, "t": 287.203, "r": 172.796, "b": 293.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 293.491, "r_x1": 172.796, "r_y1": 293.491, "r_x2": 172.796, "r_y2": 287.203, "r_x3": 160.67, "r_y3": 287.203, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 168.246, "t": 294.019, "r": 351.469, "b": 300.308, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 300.308, "r_x1": 351.469, "r_y1": 300.308, "r_x2": 351.469, "r_y2": 294.019, "r_x3": 168.246, "r_y3": 294.019, "coord_origin": "TOPLEFT"}, "text": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "orig": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 160.67, "t": 300.836, "r": 174.69, "b": 307.125, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 307.125, "r_x1": 174.69, "r_y1": 307.125, "r_x2": 174.69, "r_y2": 300.836, "r_x3": 160.67, "r_y3": 300.836, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 160.67, "t": 307.653, "r": 172.796, "b": 313.942, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 313.942, "r_x1": 172.796, "r_y1": 313.942, "r_x2": 172.796, "r_y2": 307.653, "r_x3": 160.67, "r_y3": 307.653, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 168.246, "t": 314.47, "r": 265.275, "b": 320.759, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 320.759, "r_x1": 265.275, "r_y1": 320.759, "r_x2": 265.275, "r_y2": 314.47, "r_x3": 168.246, "r_y3": 314.47, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 160.67, "t": 321.287, "r": 174.69, "b": 327.575, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 327.575, "r_x1": 174.69, "r_y1": 327.575, "r_x2": 174.69, "r_y2": 321.287, "r_x3": 160.67, "r_y3": 321.287, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 160.67, "t": 328.103, "r": 172.796, "b": 334.392, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 334.392, "r_x1": 172.796, "r_y1": 334.392, "r_x2": 172.796, "r_y2": 328.103, "r_x3": 160.67, "r_y3": 328.103, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 168.246, "t": 334.92, "r": 373.091, "b": 341.209, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 341.209, "r_x1": 373.091, "r_y1": 341.209, "r_x2": 373.091, "r_y2": 334.92, "r_x3": 168.246, "r_y3": 334.92, "coord_origin": "TOPLEFT"}, "text": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 160.67, "t": 341.737, "r": 174.69, "b": 348.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 348.026, "r_x1": 174.69, "r_y1": 348.026, "r_x2": 174.69, "r_y2": 341.737, "r_x3": 160.67, "r_y3": 341.737, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 160.67, "t": 348.553, "r": 172.796, "b": 354.842, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 354.842, "r_x1": 172.796, "r_y1": 354.842, "r_x2": 172.796, "r_y2": 348.553, "r_x3": 160.67, "r_y3": 348.553, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 168.246, "t": 355.37, "r": 298.249, "b": 361.659, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 361.659, "r_x1": 298.249, "r_y1": 361.659, "r_x2": 298.249, "r_y2": 355.37, "r_x3": 168.246, "r_y3": 355.37, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 160.67, "t": 362.187, "r": 174.69, "b": 368.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 368.476, "r_x1": 174.69, "r_y1": 368.476, "r_x2": 174.69, "r_y2": 362.187, "r_x3": 160.67, "r_y3": 362.187, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 160.67, "t": 369.004, "r": 172.796, "b": 375.292, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 375.292, "r_x1": 172.796, "r_y1": 375.292, "r_x2": 172.796, "r_y2": 369.004, "r_x3": 160.67, "r_y3": 369.004, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 168.246, "t": 375.821, "r": 298.249, "b": 382.109, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 382.109, "r_x1": 298.249, "r_y1": 382.109, "r_x2": 298.249, "r_y2": 375.821, "r_x3": 168.246, "r_y3": 375.821, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 160.67, "t": 382.637, "r": 174.69, "b": 388.926, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 388.926, "r_x1": 174.69, "r_y1": 388.926, "r_x2": 174.69, "r_y2": 382.637, "r_x3": 160.67, "r_y3": 382.637, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 153.095, "t": 389.454, "r": 177.733, "b": 395.743, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 395.743, "r_x1": 177.733, "r_y1": 395.743, "r_x2": 177.733, "r_y2": 389.454, "r_x3": 153.095, "r_y3": 389.454, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 395.061, "t": 411.443, "r": 412.476, "b": 419.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.061, "r_y0": 419.828, "r_x1": 412.476, "r_y1": 419.828, "r_x2": 412.476, "r_y2": 411.443, "r_x3": 395.061, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 418.693, "t": 411.443, "r": 436.571, "b": 419.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.693, "r_y0": 419.828, "r_x1": 436.571, "r_y1": 419.828, "r_x2": 436.571, "r_y2": 411.443, "r_x3": 418.693, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 152.362, "t": 409.855, "r": 175.106, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 416.144, "r_x1": 175.106, "r_y1": 416.144, "r_x2": 175.106, "r_y2": 409.855, "r_x3": 152.362, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 178.894, "t": 409.855, "r": 191.019, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.894, "r_y0": 416.144, "r_x1": 191.019, "r_y1": 416.144, "r_x2": 191.019, "r_y2": 409.855, "r_x3": 178.894, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 194.807, "t": 409.855, "r": 208.826, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.807, "r_y0": 416.144, "r_x1": 208.826, "r_y1": 416.144, "r_x2": 208.826, "r_y2": 409.855, "r_x3": 194.807, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 212.614, "t": 409.855, "r": 226.26, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.614, "r_y0": 416.144, "r_x1": 226.26, "r_y1": 416.144, "r_x2": 226.26, "r_y2": 409.855, "r_x3": 212.614, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 230.047, "t": 409.855, "r": 245.588, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.047, "r_y0": 416.144, "r_x1": 245.588, "r_y1": 416.144, "r_x2": 245.588, "r_y2": 409.855, "r_x3": 230.047, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 249.375, "t": 409.855, "r": 259.039, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.375, "r_y0": 416.144, "r_x1": 259.039, "r_y1": 416.144, "r_x2": 259.039, "r_y2": 409.855, "r_x3": 249.375, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td", "orig": "<td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 262.828, "t": 409.855, "r": 298.936, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.828, "r_y0": 416.144, "r_x1": 298.936, "r_y1": 416.144, "r_x2": 298.936, "r_y2": 409.855, "r_x3": 262.828, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"2\"", "orig": "colspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 302.724, "t": 409.855, "r": 338.832, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.724, "r_y0": 416.144, "r_x1": 338.832, "r_y1": 416.144, "r_x2": 338.832, "r_y2": 409.855, "r_x3": 302.724, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"3\"", "orig": "colspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 152.362, "t": 418.187, "r": 190.741, "b": 424.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 424.476, "r_x1": 190.741, "r_y1": 424.476, "r_x2": 190.741, "r_y2": 418.187, "r_x3": 152.362, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"2\"", "orig": "rowspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 194.529, "t": 418.187, "r": 232.908, "b": 424.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.529, "r_y0": 424.476, "r_x1": 232.908, "r_y1": 424.476, "r_x2": 232.908, "r_y2": 418.187, "r_x3": 194.529, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"3\"", "orig": "rowspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 236.695, "t": 418.187, "r": 269.101, "b": 424.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.695, "r_y0": 424.476, "r_x1": 269.101, "r_y1": 424.476, "r_x2": 269.101, "r_y2": 418.187, "r_x3": 236.695, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "> </table>", "orig": "> </table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 154.506, "t": 258.692, "r": 185.219, "b": 265.679, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.506, "r_y0": 265.679, "r_x1": 185.219, "r_y1": 265.679, "r_x2": 185.219, "r_y2": 258.692, "r_x3": 154.506, "r_y3": 258.692, "coord_origin": "TOPLEFT"}, "text": "C HTML", "orig": "C HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 164.355, "t": 266.58799999999997, "r": 222.054, "b": 273.57500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.355, "r_y0": 273.57500000000005, "r_x1": 222.054, "r_y1": 273.57500000000005, "r_x2": 222.054, "r_y2": 266.58799999999997, "r_x3": 164.355, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 224.153, "t": 266.58799999999997, "r": 232.577, "b": 273.57500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.153, "r_y0": 273.57500000000005, "r_x1": 232.577, "r_y1": 273.57500000000005, "r_x2": 232.577, "r_y2": 266.58799999999997, "r_x3": 224.153, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 452.314, "r": 480.592, "b": 520.887, "coord_origin": "TOPLEFT"}, "confidence": 0.950499951839447, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 461.111, "r_x1": 161.329, "r_y1": 461.111, "r_x2": 161.329, "r_y2": 452.314, "r_x3": 134.765, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.269, "r_y0": 461.111, "r_x1": 226.286, "r_y1": 461.111, "r_x2": 226.286, "r_y2": 452.314, "r_x3": 164.269, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.992, "r_y0": 461.111, "r_x1": 480.592, "r_y1": 461.111, "r_x2": 480.592, "r_y2": 452.314, "r_x3": 229.992, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 473.066, "r_x1": 480.592, "r_y1": 473.066, "r_x2": 480.592, "r_y2": 464.269, "r_x3": 134.765, "r_y3": 464.269, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 485.021, "r_x1": 480.587, "r_y1": 485.021, "r_x2": 480.587, "r_y2": 476.224, "r_x3": 134.765, "r_y3": 476.224, "coord_origin": "TOPLEFT"}, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 496.977, "r_x1": 480.587, "r_y1": 496.977, "r_x2": 480.587, "r_y2": 488.18, "r_x3": 134.765, "r_y3": 488.18, "coord_origin": "TOPLEFT"}, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 508.932, "r_x1": 165.481, "r_y1": 508.932, "r_x2": 165.481, "r_y2": 500.135, "r_x3": 134.765, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "area of", "orig": "area of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.874, "r_y0": 508.932, "r_x1": 207.895, "r_y1": 508.932, "r_x2": 207.895, "r_y2": 500.135, "r_x3": 169.874, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "research,", "orig": "research,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.289, "r_y0": 508.932, "r_x1": 220.589, "r_y1": 508.932, "r_x2": 220.589, "r_y2": 500.135, "r_x3": 212.289, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.992, "r_y0": 508.932, "r_x1": 480.59, "r_y1": 508.932, "r_x2": 480.59, "r_y2": 500.135, "r_x3": 224.992, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "which many novel machine learning algorithms are being", "orig": "which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 520.887, "r_x1": 313.246, "r_y1": 520.887, "r_x2": 313.246, "r_y2": 512.0899999999999, "r_x3": 134.765, "r_y3": 512.0899999999999, "coord_origin": "TOPLEFT"}, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 524.5509999999999, "r": 480.595, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9845512509346008, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 533.348, "r_x1": 187.471, "r_y1": 533.348, "r_x2": 187.471, "r_y2": 524.5509999999999, "r_x3": 149.709, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "Recently", "orig": "Recently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.194, "r_y0": 533.348, "r_x1": 480.589, "r_y1": 533.348, "r_x2": 480.589, "r_y2": 524.5509999999999, "r_x3": 192.194, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "emerging SOTA methods for table structure recognition employ", "orig": "emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 480.592, "r_y1": 545.304, "r_x2": 480.592, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.589, "r_y1": 557.259, "r_x2": 480.589, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 480.588, "r_y1": 569.2139999999999, "r_x2": 480.588, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 480.59, "r_y1": 581.169, "r_x2": 480.59, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.595, "r_y1": 593.124, "r_x2": 480.595, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.587, "r_y1": 605.08, "r_x2": 480.587, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.595, "r_y1": 617.035, "r_x2": 480.595, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.594, "r_y1": 628.99, "r_x2": 480.594, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.595, "r_y1": 640.9449999999999, "r_x2": 480.595, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.588, "r_y1": 652.9, "r_x2": 480.588, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 421.454, "r_y1": 664.855, "r_x2": 421.454, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 5, "page_no": 1, "cluster": {"id": 5, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8580349683761597, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2"}, {"label": "page_header", "id": 3, "page_no": 1, "cluster": {"id": 3, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9076642990112305, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}, {"label": "caption", "id": 4, "page_no": 1, "cluster": {"id": 4, "label": "caption", "bbox": {"l": 134.765, "t": 124.11900000000003, "r": 480.592, "b": 201.16200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.8939083218574524, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 134.26, "r_x1": 162.644, "r_y1": 134.26, "r_x2": 162.644, "r_y2": 126.33399999999995, "r_x3": 134.765, "r_y3": 126.33399999999995, "coord_origin": "TOPLEFT"}, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.062, "r_y0": 135.40800000000002, "r_x1": 480.591, "r_y1": 135.40800000000002, "r_x2": 480.591, "r_y2": 124.11900000000003, "r_x3": 167.062, "r_y3": 124.11900000000003, "coord_origin": "TOPLEFT"}, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 146.36699999999996, "r_x1": 190.823, "r_y1": 146.36699999999996, "r_x2": 190.823, "r_y2": 135.07799999999997, "r_x3": 134.765, "r_y3": 135.07799999999997, "coord_origin": "TOPLEFT"}, "text": "table-example", "orig": "table-example", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.199, "r_y0": 146.36699999999996, "r_x1": 480.59, "r_y1": 146.36699999999996, "r_x2": 480.59, "r_y2": 135.07799999999997, "r_x3": 195.199, "r_y3": 135.07799999999997, "coord_origin": "TOPLEFT"}, "text": "with complex row and column headers, including a 2D empty span,", "orig": "with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 157.32600000000002, "r_x1": 480.591, "r_y1": 157.32600000000002, "r_x2": 480.591, "r_y2": 146.03700000000003, "r_x3": 134.765, "r_y3": 146.03700000000003, "coord_origin": "TOPLEFT"}, "text": "(B) minimal graphical representation of table structure using rectangular layout, (C)", "orig": "(B) minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 168.28499999999997, "r_x1": 480.592, "r_y1": 168.28499999999997, "r_x2": 480.592, "r_y2": 156.99599999999998, "r_x3": 134.765, "r_y3": 156.99599999999998, "coord_origin": "TOPLEFT"}, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 179.24400000000003, "r_x1": 480.589, "r_y1": 179.24400000000003, "r_x2": 480.589, "r_y2": 167.95500000000004, "r_x3": 134.765, "r_y3": 167.95500000000004, "coord_origin": "TOPLEFT"}, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 190.20299999999997, "r_x1": 480.59, "r_y1": 190.20299999999997, "r_x2": 480.59, "r_y2": 178.914, "r_x3": 134.765, "r_y3": 178.914, "coord_origin": "TOPLEFT"}, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 201.16200000000003, "r_x1": 460.871, "r_y1": 201.16200000000003, "r_x2": 460.871, "r_y2": 189.87300000000005, "r_x3": 134.765, "r_y3": 189.87300000000005, "coord_origin": "TOPLEFT"}, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 1. Comparison between HTML and OTSL table structure representation: (A) table-example with complex row and column headers, including a 2D empty span, (B) minimal graphical representation of table structure using rectangular layout, (C) HTML representation, (D) OTSL representation. This example demonstrates many of the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case), its reduced sequence length (55 versus 30) and a enhanced internal structure (variable token sequence length per row in HTML versus a fixed length of rows in OTSL)."}, {"label": "picture", "id": 1, "page_no": 1, "cluster": {"id": 1, "label": "picture", "bbox": {"l": 148.45364379882812, "t": 208.37423706054688, "r": 464.3608093261719, "b": 425.8462219238281, "coord_origin": "TOPLEFT"}, "confidence": 0.9688959121704102, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.411, "r_y0": 289.478, "r_x1": 446.134, "r_y1": 288.875, "r_x2": 446.134, "r_y2": 280.49, "r_x3": 396.411, "r_y3": 281.093, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.748, "r_y0": 311.731, "r_x1": 463.795, "r_y1": 311.337, "r_x2": 463.795, "r_y2": 302.952, "r_x3": 395.748, "r_y3": 303.346, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.563, "r_y0": 322.9, "r_x1": 463.716, "r_y1": 322.618, "r_x2": 463.716, "r_y2": 314.233, "r_x3": 407.563, "r_y3": 314.515, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.511, "r_y0": 300.579, "r_x1": 463.773, "r_y1": 300.093, "r_x2": 463.773, "r_y2": 291.708, "r_x3": 418.511, "r_y3": 292.194, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.397, "r_y0": 333.784, "r_x1": 463.915, "r_y1": 333.963, "r_x2": 463.915, "r_y2": 325.578, "r_x3": 407.397, "r_y3": 325.399, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.895, "r_y0": 288.651, "r_x1": 463.513, "r_y1": 288.651, "r_x2": 463.513, "r_y2": 280.266, "r_x3": 451.895, "r_y3": 280.266, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.097, "r_y0": 322.989, "r_x1": 402.659, "r_y1": 322.989, "r_x2": 402.659, "r_y2": 314.604, "r_x3": 396.097, "r_y3": 314.604, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.998, "r_y0": 333.883, "r_x1": 402.561, "r_y1": 333.883, "r_x2": 402.561, "r_y2": 325.498, "r_x3": 395.998, "r_y3": 325.498, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.275, "r_y0": 300.765, "r_x1": 414.036, "r_y1": 300.628, "r_x2": 414.036, "r_y2": 292.243, "r_x3": 396.275, "r_y3": 292.38, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.256, "r_y0": 419.675, "r_x1": 452.874, "r_y1": 419.675, "r_x2": 452.874, "r_y2": 411.29, "r_x3": 441.256, "r_y3": 411.29, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 406.873, "r_x1": 432.489, "r_y1": 406.873, "r_x2": 432.489, "r_y2": 399.886, "r_x3": 393.753, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.59, "r_y0": 406.873, "r_x1": 438.801, "r_y1": 406.873, "r_x2": 438.801, "r_y2": 399.886, "r_x3": 434.59, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.906, "r_y0": 406.873, "r_x1": 463.222, "r_y1": 406.873, "r_x2": 463.222, "r_y2": 399.886, "r_x3": 440.906, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.118, "r_y0": 265.626, "r_x1": 413.993, "r_y1": 265.626, "r_x2": 413.993, "r_y2": 258.63800000000003, "r_x3": 384.118, "r_y3": 258.63800000000003, "coord_origin": "TOPLEFT"}, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 273.75300000000004, "r_x1": 451.451, "r_y1": 273.75300000000004, "r_x2": 451.451, "r_y2": 266.76599999999996, "r_x3": 393.753, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.551, "r_y0": 273.75300000000004, "r_x1": 461.975, "r_y1": 273.75300000000004, "r_x2": 461.975, "r_y2": 266.76599999999996, "r_x3": 453.551, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.793, "r_y0": 406.839, "r_x1": 233.894, "r_y1": 406.839, "r_x2": 233.894, "r_y2": 399.851, "r_x3": 151.793, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.993, "r_y0": 406.839, "r_x1": 244.417, "r_y1": 406.839, "r_x2": 244.417, "r_y2": 399.851, "r_x3": 235.993, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.522, "r_y0": 406.839, "r_x1": 268.839, "r_y1": 406.839, "r_x2": 268.839, "r_y2": 399.851, "r_x3": 246.522, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.33, "r_y0": 220.65300000000002, "r_x1": 159.798, "r_y1": 220.65300000000002, "r_x2": 159.798, "r_y2": 213.66600000000005, "r_x3": 154.33, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.071, "r_y0": 220.65300000000002, "r_x1": 326.539, "r_y1": 220.65300000000002, "r_x2": 326.539, "r_y2": 213.66600000000005, "r_x3": 321.071, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 286.675, "r_x1": 175.839, "r_y1": 286.675, "r_x2": 175.839, "r_y2": 280.386, "r_x3": 153.095, "r_y3": 280.386, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 293.491, "r_x1": 172.796, "r_y1": 293.491, "r_x2": 172.796, "r_y2": 287.203, "r_x3": 160.67, "r_y3": 287.203, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 300.308, "r_x1": 351.469, "r_y1": 300.308, "r_x2": 351.469, "r_y2": 294.019, "r_x3": 168.246, "r_y3": 294.019, "coord_origin": "TOPLEFT"}, "text": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "orig": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 307.125, "r_x1": 174.69, "r_y1": 307.125, "r_x2": 174.69, "r_y2": 300.836, "r_x3": 160.67, "r_y3": 300.836, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 313.942, "r_x1": 172.796, "r_y1": 313.942, "r_x2": 172.796, "r_y2": 307.653, "r_x3": 160.67, "r_y3": 307.653, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 320.759, "r_x1": 265.275, "r_y1": 320.759, "r_x2": 265.275, "r_y2": 314.47, "r_x3": 168.246, "r_y3": 314.47, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 327.575, "r_x1": 174.69, "r_y1": 327.575, "r_x2": 174.69, "r_y2": 321.287, "r_x3": 160.67, "r_y3": 321.287, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 334.392, "r_x1": 172.796, "r_y1": 334.392, "r_x2": 172.796, "r_y2": 328.103, "r_x3": 160.67, "r_y3": 328.103, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 341.209, "r_x1": 373.091, "r_y1": 341.209, "r_x2": 373.091, "r_y2": 334.92, "r_x3": 168.246, "r_y3": 334.92, "coord_origin": "TOPLEFT"}, "text": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 348.026, "r_x1": 174.69, "r_y1": 348.026, "r_x2": 174.69, "r_y2": 341.737, "r_x3": 160.67, "r_y3": 341.737, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 354.842, "r_x1": 172.796, "r_y1": 354.842, "r_x2": 172.796, "r_y2": 348.553, "r_x3": 160.67, "r_y3": 348.553, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 361.659, "r_x1": 298.249, "r_y1": 361.659, "r_x2": 298.249, "r_y2": 355.37, "r_x3": 168.246, "r_y3": 355.37, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 368.476, "r_x1": 174.69, "r_y1": 368.476, "r_x2": 174.69, "r_y2": 362.187, "r_x3": 160.67, "r_y3": 362.187, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 375.292, "r_x1": 172.796, "r_y1": 375.292, "r_x2": 172.796, "r_y2": 369.004, "r_x3": 160.67, "r_y3": 369.004, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 382.109, "r_x1": 298.249, "r_y1": 382.109, "r_x2": 298.249, "r_y2": 375.821, "r_x3": 168.246, "r_y3": 375.821, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 388.926, "r_x1": 174.69, "r_y1": 388.926, "r_x2": 174.69, "r_y2": 382.637, "r_x3": 160.67, "r_y3": 382.637, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 395.743, "r_x1": 177.733, "r_y1": 395.743, "r_x2": 177.733, "r_y2": 389.454, "r_x3": 153.095, "r_y3": 389.454, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.061, "r_y0": 419.828, "r_x1": 412.476, "r_y1": 419.828, "r_x2": 412.476, "r_y2": 411.443, "r_x3": 395.061, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.693, "r_y0": 419.828, "r_x1": 436.571, "r_y1": 419.828, "r_x2": 436.571, "r_y2": 411.443, "r_x3": 418.693, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 416.144, "r_x1": 175.106, "r_y1": 416.144, "r_x2": 175.106, "r_y2": 409.855, "r_x3": 152.362, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.894, "r_y0": 416.144, "r_x1": 191.019, "r_y1": 416.144, "r_x2": 191.019, "r_y2": 409.855, "r_x3": 178.894, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.807, "r_y0": 416.144, "r_x1": 208.826, "r_y1": 416.144, "r_x2": 208.826, "r_y2": 409.855, "r_x3": 194.807, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.614, "r_y0": 416.144, "r_x1": 226.26, "r_y1": 416.144, "r_x2": 226.26, "r_y2": 409.855, "r_x3": 212.614, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.047, "r_y0": 416.144, "r_x1": 245.588, "r_y1": 416.144, "r_x2": 245.588, "r_y2": 409.855, "r_x3": 230.047, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.375, "r_y0": 416.144, "r_x1": 259.039, "r_y1": 416.144, "r_x2": 259.039, "r_y2": 409.855, "r_x3": 249.375, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td", "orig": "<td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.828, "r_y0": 416.144, "r_x1": 298.936, "r_y1": 416.144, "r_x2": 298.936, "r_y2": 409.855, "r_x3": 262.828, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"2\"", "orig": "colspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.724, "r_y0": 416.144, "r_x1": 338.832, "r_y1": 416.144, "r_x2": 338.832, "r_y2": 409.855, "r_x3": 302.724, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"3\"", "orig": "colspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 424.476, "r_x1": 190.741, "r_y1": 424.476, "r_x2": 190.741, "r_y2": 418.187, "r_x3": 152.362, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"2\"", "orig": "rowspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.529, "r_y0": 424.476, "r_x1": 232.908, "r_y1": 424.476, "r_x2": 232.908, "r_y2": 418.187, "r_x3": 194.529, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"3\"", "orig": "rowspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.695, "r_y0": 424.476, "r_x1": 269.101, "r_y1": 424.476, "r_x2": 269.101, "r_y2": 418.187, "r_x3": 236.695, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "> </table>", "orig": "> </table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.506, "r_y0": 265.679, "r_x1": 185.219, "r_y1": 265.679, "r_x2": 185.219, "r_y2": 258.692, "r_x3": 154.506, "r_y3": 258.692, "coord_origin": "TOPLEFT"}, "text": "C HTML", "orig": "C HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.355, "r_y0": 273.57500000000005, "r_x1": 222.054, "r_y1": 273.57500000000005, "r_x2": 222.054, "r_y2": 266.58799999999997, "r_x3": 164.355, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.153, "r_y0": 273.57500000000005, "r_x1": 232.577, "r_y1": 273.57500000000005, "r_x2": 232.577, "r_y2": 266.58799999999997, "r_x3": 224.153, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 396.411, "t": 280.49, "r": 446.134, "b": 289.478, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.411, "r_y0": 289.478, "r_x1": 446.134, "r_y1": 288.875, "r_x2": 446.134, "r_y2": 280.49, "r_x3": 396.411, "r_y3": 281.093, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 395.748, "t": 302.952, "r": 463.795, "b": 311.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.748, "r_y0": 311.731, "r_x1": 463.795, "r_y1": 311.337, "r_x2": 463.795, "r_y2": 302.952, "r_x3": 395.748, "r_y3": 303.346, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 407.563, "t": 314.233, "r": 463.716, "b": 322.9, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.563, "r_y0": 322.9, "r_x1": 463.716, "r_y1": 322.618, "r_x2": 463.716, "r_y2": 314.233, "r_x3": 407.563, "r_y3": 314.515, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 418.511, "t": 291.708, "r": 463.773, "b": 300.579, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.511, "r_y0": 300.579, "r_x1": 463.773, "r_y1": 300.093, "r_x2": 463.773, "r_y2": 291.708, "r_x3": 418.511, "r_y3": 292.194, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 407.397, "t": 325.399, "r": 463.915, "b": 333.963, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.397, "r_y0": 333.784, "r_x1": 463.915, "r_y1": 333.963, "r_x2": 463.915, "r_y2": 325.578, "r_x3": 407.397, "r_y3": 325.399, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 451.895, "t": 280.266, "r": 463.513, "b": 288.651, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.895, "r_y0": 288.651, "r_x1": 463.513, "r_y1": 288.651, "r_x2": 463.513, "r_y2": 280.266, "r_x3": 451.895, "r_y3": 280.266, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 396.097, "t": 314.604, "r": 402.659, "b": 322.989, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.097, "r_y0": 322.989, "r_x1": 402.659, "r_y1": 322.989, "r_x2": 402.659, "r_y2": 314.604, "r_x3": 396.097, "r_y3": 314.604, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 395.998, "t": 325.498, "r": 402.561, "b": 333.883, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.998, "r_y0": 333.883, "r_x1": 402.561, "r_y1": 333.883, "r_x2": 402.561, "r_y2": 325.498, "r_x3": 395.998, "r_y3": 325.498, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 396.275, "t": 292.243, "r": 414.036, "b": 300.765, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.275, "r_y0": 300.765, "r_x1": 414.036, "r_y1": 300.628, "r_x2": 414.036, "r_y2": 292.243, "r_x3": 396.275, "r_y3": 292.38, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 441.256, "t": 411.29, "r": 452.874, "b": 419.675, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.256, "r_y0": 419.675, "r_x1": 452.874, "r_y1": 419.675, "r_x2": 452.874, "r_y2": 411.29, "r_x3": 441.256, "r_y3": 411.29, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 393.753, "t": 399.886, "r": 432.489, "b": 406.873, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 406.873, "r_x1": 432.489, "r_y1": 406.873, "r_x2": 432.489, "r_y2": 399.886, "r_x3": 393.753, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 434.59, "t": 399.886, "r": 438.801, "b": 406.873, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.59, "r_y0": 406.873, "r_x1": 438.801, "r_y1": 406.873, "r_x2": 438.801, "r_y2": 399.886, "r_x3": 434.59, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 440.906, "t": 399.886, "r": 463.222, "b": 406.873, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.906, "r_y0": 406.873, "r_x1": 463.222, "r_y1": 406.873, "r_x2": 463.222, "r_y2": 399.886, "r_x3": 440.906, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 384.118, "t": 258.63800000000003, "r": 413.993, "b": 265.626, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.118, "r_y0": 265.626, "r_x1": 413.993, "r_y1": 265.626, "r_x2": 413.993, "r_y2": 258.63800000000003, "r_x3": 384.118, "r_y3": 258.63800000000003, "coord_origin": "TOPLEFT"}, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 393.753, "t": 266.76599999999996, "r": 451.451, "b": 273.75300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 273.75300000000004, "r_x1": 451.451, "r_y1": 273.75300000000004, "r_x2": 451.451, "r_y2": 266.76599999999996, "r_x3": 393.753, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 453.551, "t": 266.76599999999996, "r": 461.975, "b": 273.75300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.551, "r_y0": 273.75300000000004, "r_x1": 461.975, "r_y1": 273.75300000000004, "r_x2": 461.975, "r_y2": 266.76599999999996, "r_x3": 453.551, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 151.793, "t": 399.851, "r": 233.894, "b": 406.839, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.793, "r_y0": 406.839, "r_x1": 233.894, "r_y1": 406.839, "r_x2": 233.894, "r_y2": 399.851, "r_x3": 151.793, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 235.993, "t": 399.851, "r": 244.417, "b": 406.839, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.993, "r_y0": 406.839, "r_x1": 244.417, "r_y1": 406.839, "r_x2": 244.417, "r_y2": 399.851, "r_x3": 235.993, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 246.522, "t": 399.851, "r": 268.839, "b": 406.839, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.522, "r_y0": 406.839, "r_x1": 268.839, "r_y1": 406.839, "r_x2": 268.839, "r_y2": 399.851, "r_x3": 246.522, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 154.33, "t": 213.66600000000005, "r": 159.798, "b": 220.65300000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.33, "r_y0": 220.65300000000002, "r_x1": 159.798, "r_y1": 220.65300000000002, "r_x2": 159.798, "r_y2": 213.66600000000005, "r_x3": 154.33, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 321.071, "t": 213.66600000000005, "r": 326.539, "b": 220.65300000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.071, "r_y0": 220.65300000000002, "r_x1": 326.539, "r_y1": 220.65300000000002, "r_x2": 326.539, "r_y2": 213.66600000000005, "r_x3": 321.071, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 153.095, "t": 280.386, "r": 175.839, "b": 286.675, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 286.675, "r_x1": 175.839, "r_y1": 286.675, "r_x2": 175.839, "r_y2": 280.386, "r_x3": 153.095, "r_y3": 280.386, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 160.67, "t": 287.203, "r": 172.796, "b": 293.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 293.491, "r_x1": 172.796, "r_y1": 293.491, "r_x2": 172.796, "r_y2": 287.203, "r_x3": 160.67, "r_y3": 287.203, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 168.246, "t": 294.019, "r": 351.469, "b": 300.308, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 300.308, "r_x1": 351.469, "r_y1": 300.308, "r_x2": 351.469, "r_y2": 294.019, "r_x3": 168.246, "r_y3": 294.019, "coord_origin": "TOPLEFT"}, "text": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "orig": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 160.67, "t": 300.836, "r": 174.69, "b": 307.125, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 307.125, "r_x1": 174.69, "r_y1": 307.125, "r_x2": 174.69, "r_y2": 300.836, "r_x3": 160.67, "r_y3": 300.836, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 160.67, "t": 307.653, "r": 172.796, "b": 313.942, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 313.942, "r_x1": 172.796, "r_y1": 313.942, "r_x2": 172.796, "r_y2": 307.653, "r_x3": 160.67, "r_y3": 307.653, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 168.246, "t": 314.47, "r": 265.275, "b": 320.759, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 320.759, "r_x1": 265.275, "r_y1": 320.759, "r_x2": 265.275, "r_y2": 314.47, "r_x3": 168.246, "r_y3": 314.47, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 160.67, "t": 321.287, "r": 174.69, "b": 327.575, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 327.575, "r_x1": 174.69, "r_y1": 327.575, "r_x2": 174.69, "r_y2": 321.287, "r_x3": 160.67, "r_y3": 321.287, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 160.67, "t": 328.103, "r": 172.796, "b": 334.392, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 334.392, "r_x1": 172.796, "r_y1": 334.392, "r_x2": 172.796, "r_y2": 328.103, "r_x3": 160.67, "r_y3": 328.103, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 168.246, "t": 334.92, "r": 373.091, "b": 341.209, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 341.209, "r_x1": 373.091, "r_y1": 341.209, "r_x2": 373.091, "r_y2": 334.92, "r_x3": 168.246, "r_y3": 334.92, "coord_origin": "TOPLEFT"}, "text": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 160.67, "t": 341.737, "r": 174.69, "b": 348.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 348.026, "r_x1": 174.69, "r_y1": 348.026, "r_x2": 174.69, "r_y2": 341.737, "r_x3": 160.67, "r_y3": 341.737, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 160.67, "t": 348.553, "r": 172.796, "b": 354.842, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 354.842, "r_x1": 172.796, "r_y1": 354.842, "r_x2": 172.796, "r_y2": 348.553, "r_x3": 160.67, "r_y3": 348.553, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 168.246, "t": 355.37, "r": 298.249, "b": 361.659, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 361.659, "r_x1": 298.249, "r_y1": 361.659, "r_x2": 298.249, "r_y2": 355.37, "r_x3": 168.246, "r_y3": 355.37, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 160.67, "t": 362.187, "r": 174.69, "b": 368.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 368.476, "r_x1": 174.69, "r_y1": 368.476, "r_x2": 174.69, "r_y2": 362.187, "r_x3": 160.67, "r_y3": 362.187, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 160.67, "t": 369.004, "r": 172.796, "b": 375.292, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 375.292, "r_x1": 172.796, "r_y1": 375.292, "r_x2": 172.796, "r_y2": 369.004, "r_x3": 160.67, "r_y3": 369.004, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 168.246, "t": 375.821, "r": 298.249, "b": 382.109, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 382.109, "r_x1": 298.249, "r_y1": 382.109, "r_x2": 298.249, "r_y2": 375.821, "r_x3": 168.246, "r_y3": 375.821, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 160.67, "t": 382.637, "r": 174.69, "b": 388.926, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 388.926, "r_x1": 174.69, "r_y1": 388.926, "r_x2": 174.69, "r_y2": 382.637, "r_x3": 160.67, "r_y3": 382.637, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 153.095, "t": 389.454, "r": 177.733, "b": 395.743, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 395.743, "r_x1": 177.733, "r_y1": 395.743, "r_x2": 177.733, "r_y2": 389.454, "r_x3": 153.095, "r_y3": 389.454, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 395.061, "t": 411.443, "r": 412.476, "b": 419.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.061, "r_y0": 419.828, "r_x1": 412.476, "r_y1": 419.828, "r_x2": 412.476, "r_y2": 411.443, "r_x3": 395.061, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 418.693, "t": 411.443, "r": 436.571, "b": 419.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.693, "r_y0": 419.828, "r_x1": 436.571, "r_y1": 419.828, "r_x2": 436.571, "r_y2": 411.443, "r_x3": 418.693, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 152.362, "t": 409.855, "r": 175.106, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 416.144, "r_x1": 175.106, "r_y1": 416.144, "r_x2": 175.106, "r_y2": 409.855, "r_x3": 152.362, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 178.894, "t": 409.855, "r": 191.019, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.894, "r_y0": 416.144, "r_x1": 191.019, "r_y1": 416.144, "r_x2": 191.019, "r_y2": 409.855, "r_x3": 178.894, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 194.807, "t": 409.855, "r": 208.826, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.807, "r_y0": 416.144, "r_x1": 208.826, "r_y1": 416.144, "r_x2": 208.826, "r_y2": 409.855, "r_x3": 194.807, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 212.614, "t": 409.855, "r": 226.26, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.614, "r_y0": 416.144, "r_x1": 226.26, "r_y1": 416.144, "r_x2": 226.26, "r_y2": 409.855, "r_x3": 212.614, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 230.047, "t": 409.855, "r": 245.588, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.047, "r_y0": 416.144, "r_x1": 245.588, "r_y1": 416.144, "r_x2": 245.588, "r_y2": 409.855, "r_x3": 230.047, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 249.375, "t": 409.855, "r": 259.039, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.375, "r_y0": 416.144, "r_x1": 259.039, "r_y1": 416.144, "r_x2": 259.039, "r_y2": 409.855, "r_x3": 249.375, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td", "orig": "<td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 262.828, "t": 409.855, "r": 298.936, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.828, "r_y0": 416.144, "r_x1": 298.936, "r_y1": 416.144, "r_x2": 298.936, "r_y2": 409.855, "r_x3": 262.828, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"2\"", "orig": "colspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 302.724, "t": 409.855, "r": 338.832, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.724, "r_y0": 416.144, "r_x1": 338.832, "r_y1": 416.144, "r_x2": 338.832, "r_y2": 409.855, "r_x3": 302.724, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"3\"", "orig": "colspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 152.362, "t": 418.187, "r": 190.741, "b": 424.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 424.476, "r_x1": 190.741, "r_y1": 424.476, "r_x2": 190.741, "r_y2": 418.187, "r_x3": 152.362, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"2\"", "orig": "rowspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 194.529, "t": 418.187, "r": 232.908, "b": 424.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.529, "r_y0": 424.476, "r_x1": 232.908, "r_y1": 424.476, "r_x2": 232.908, "r_y2": 418.187, "r_x3": 194.529, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"3\"", "orig": "rowspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 236.695, "t": 418.187, "r": 269.101, "b": 424.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.695, "r_y0": 424.476, "r_x1": 269.101, "r_y1": 424.476, "r_x2": 269.101, "r_y2": 418.187, "r_x3": 236.695, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "> </table>", "orig": "> </table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 154.506, "t": 258.692, "r": 185.219, "b": 265.679, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.506, "r_y0": 265.679, "r_x1": 185.219, "r_y1": 265.679, "r_x2": 185.219, "r_y2": 258.692, "r_x3": 154.506, "r_y3": 258.692, "coord_origin": "TOPLEFT"}, "text": "C HTML", "orig": "C HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 164.355, "t": 266.58799999999997, "r": 222.054, "b": 273.57500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.355, "r_y0": 273.57500000000005, "r_x1": 222.054, "r_y1": 273.57500000000005, "r_x2": 222.054, "r_y2": 266.58799999999997, "r_x3": 164.355, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 224.153, "t": 266.58799999999997, "r": 232.577, "b": 273.57500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.153, "r_y0": 273.57500000000005, "r_x1": 232.577, "r_y1": 273.57500000000005, "r_x2": 232.577, "r_y2": 266.58799999999997, "r_x3": 224.153, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "text", "id": 2, "page_no": 1, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 452.314, "r": 480.592, "b": 520.887, "coord_origin": "TOPLEFT"}, "confidence": 0.950499951839447, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 461.111, "r_x1": 161.329, "r_y1": 461.111, "r_x2": 161.329, "r_y2": 452.314, "r_x3": 134.765, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.269, "r_y0": 461.111, "r_x1": 226.286, "r_y1": 461.111, "r_x2": 226.286, "r_y2": 452.314, "r_x3": 164.269, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.992, "r_y0": 461.111, "r_x1": 480.592, "r_y1": 461.111, "r_x2": 480.592, "r_y2": 452.314, "r_x3": 229.992, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 473.066, "r_x1": 480.592, "r_y1": 473.066, "r_x2": 480.592, "r_y2": 464.269, "r_x3": 134.765, "r_y3": 464.269, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 485.021, "r_x1": 480.587, "r_y1": 485.021, "r_x2": 480.587, "r_y2": 476.224, "r_x3": 134.765, "r_y3": 476.224, "coord_origin": "TOPLEFT"}, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 496.977, "r_x1": 480.587, "r_y1": 496.977, "r_x2": 480.587, "r_y2": 488.18, "r_x3": 134.765, "r_y3": 488.18, "coord_origin": "TOPLEFT"}, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 508.932, "r_x1": 165.481, "r_y1": 508.932, "r_x2": 165.481, "r_y2": 500.135, "r_x3": 134.765, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "area of", "orig": "area of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.874, "r_y0": 508.932, "r_x1": 207.895, "r_y1": 508.932, "r_x2": 207.895, "r_y2": 500.135, "r_x3": 169.874, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "research,", "orig": "research,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.289, "r_y0": 508.932, "r_x1": 220.589, "r_y1": 508.932, "r_x2": 220.589, "r_y2": 500.135, "r_x3": 212.289, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.992, "r_y0": 508.932, "r_x1": 480.59, "r_y1": 508.932, "r_x2": 480.59, "r_y2": 500.135, "r_x3": 224.992, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "which many novel machine learning algorithms are being", "orig": "which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 520.887, "r_x1": 313.246, "r_y1": 520.887, "r_x2": 313.246, "r_y2": 512.0899999999999, "r_x3": 134.765, "r_y3": 512.0899999999999, "coord_origin": "TOPLEFT"}, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "today, table detection in documents is a well understood problem, and the latest state-of-the-art (SOTA) object detection methods provide an accuracy comparable to human observers [7,8,10,14,23]. On the other hand, the problem of table structure recognition (TSR) is a lot more challenging and remains a very active area of research, in which many novel machine learning algorithms are being explored [3,4,5,9,11,12,13,14,17,18,21,22]."}, {"label": "text", "id": 0, "page_no": 1, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 524.5509999999999, "r": 480.595, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9845512509346008, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 533.348, "r_x1": 187.471, "r_y1": 533.348, "r_x2": 187.471, "r_y2": 524.5509999999999, "r_x3": 149.709, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "Recently", "orig": "Recently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.194, "r_y0": 533.348, "r_x1": 480.589, "r_y1": 533.348, "r_x2": 480.589, "r_y2": 524.5509999999999, "r_x3": 192.194, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "emerging SOTA methods for table structure recognition employ", "orig": "emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 480.592, "r_y1": 545.304, "r_x2": 480.592, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.589, "r_y1": 557.259, "r_x2": 480.589, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 480.588, "r_y1": 569.2139999999999, "r_x2": 480.588, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 480.59, "r_y1": 581.169, "r_x2": 480.59, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.595, "r_y1": 593.124, "r_x2": 480.595, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.587, "r_y1": 605.08, "r_x2": 480.587, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.595, "r_y1": 617.035, "r_x2": 480.595, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.594, "r_y1": 628.99, "r_x2": 480.594, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.595, "r_y1": 640.9449999999999, "r_x2": 480.595, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.588, "r_y1": 652.9, "r_x2": 480.588, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 421.454, "r_y1": 664.855, "r_x2": 421.454, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Recently emerging SOTA methods for table structure recognition employ transformer-based models, in which an image of the table is provided to the network in order to predict the structure of the table as a sequence of tokens. These image-to-sequence (Im2Seq) models are extremely powerful, since they allow for a purely data-driven solution. The tokens of the sequence typically belong to a markup language such as HTML, Latex or Markdown, which allow to describe table structure as rows, columns and spanning cells in various configurations. In Figure 1, we illustrate how HTML is used to represent the table-structure of a particular example table. Public table-structure data sets such as PubTabNet [22], and FinTabNet [21], which were created in a semi-automated way from paired PDF and HTML sources (e.g. PubMed Central), popularized primarily the use of HTML as ground-truth representation format for TSR."}], "body": [{"label": "caption", "id": 4, "page_no": 1, "cluster": {"id": 4, "label": "caption", "bbox": {"l": 134.765, "t": 124.11900000000003, "r": 480.592, "b": 201.16200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.8939083218574524, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 134.26, "r_x1": 162.644, "r_y1": 134.26, "r_x2": 162.644, "r_y2": 126.33399999999995, "r_x3": 134.765, "r_y3": 126.33399999999995, "coord_origin": "TOPLEFT"}, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.062, "r_y0": 135.40800000000002, "r_x1": 480.591, "r_y1": 135.40800000000002, "r_x2": 480.591, "r_y2": 124.11900000000003, "r_x3": 167.062, "r_y3": 124.11900000000003, "coord_origin": "TOPLEFT"}, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 146.36699999999996, "r_x1": 190.823, "r_y1": 146.36699999999996, "r_x2": 190.823, "r_y2": 135.07799999999997, "r_x3": 134.765, "r_y3": 135.07799999999997, "coord_origin": "TOPLEFT"}, "text": "table-example", "orig": "table-example", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.199, "r_y0": 146.36699999999996, "r_x1": 480.59, "r_y1": 146.36699999999996, "r_x2": 480.59, "r_y2": 135.07799999999997, "r_x3": 195.199, "r_y3": 135.07799999999997, "coord_origin": "TOPLEFT"}, "text": "with complex row and column headers, including a 2D empty span,", "orig": "with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 157.32600000000002, "r_x1": 480.591, "r_y1": 157.32600000000002, "r_x2": 480.591, "r_y2": 146.03700000000003, "r_x3": 134.765, "r_y3": 146.03700000000003, "coord_origin": "TOPLEFT"}, "text": "(B) minimal graphical representation of table structure using rectangular layout, (C)", "orig": "(B) minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 168.28499999999997, "r_x1": 480.592, "r_y1": 168.28499999999997, "r_x2": 480.592, "r_y2": 156.99599999999998, "r_x3": 134.765, "r_y3": 156.99599999999998, "coord_origin": "TOPLEFT"}, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 179.24400000000003, "r_x1": 480.589, "r_y1": 179.24400000000003, "r_x2": 480.589, "r_y2": 167.95500000000004, "r_x3": 134.765, "r_y3": 167.95500000000004, "coord_origin": "TOPLEFT"}, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 190.20299999999997, "r_x1": 480.59, "r_y1": 190.20299999999997, "r_x2": 480.59, "r_y2": 178.914, "r_x3": 134.765, "r_y3": 178.914, "coord_origin": "TOPLEFT"}, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 201.16200000000003, "r_x1": 460.871, "r_y1": 201.16200000000003, "r_x2": 460.871, "r_y2": 189.87300000000005, "r_x3": 134.765, "r_y3": 189.87300000000005, "coord_origin": "TOPLEFT"}, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 1. Comparison between HTML and OTSL table structure representation: (A) table-example with complex row and column headers, including a 2D empty span, (B) minimal graphical representation of table structure using rectangular layout, (C) HTML representation, (D) OTSL representation. This example demonstrates many of the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case), its reduced sequence length (55 versus 30) and a enhanced internal structure (variable token sequence length per row in HTML versus a fixed length of rows in OTSL)."}, {"label": "picture", "id": 1, "page_no": 1, "cluster": {"id": 1, "label": "picture", "bbox": {"l": 148.45364379882812, "t": 208.37423706054688, "r": 464.3608093261719, "b": 425.8462219238281, "coord_origin": "TOPLEFT"}, "confidence": 0.9688959121704102, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.411, "r_y0": 289.478, "r_x1": 446.134, "r_y1": 288.875, "r_x2": 446.134, "r_y2": 280.49, "r_x3": 396.411, "r_y3": 281.093, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.748, "r_y0": 311.731, "r_x1": 463.795, "r_y1": 311.337, "r_x2": 463.795, "r_y2": 302.952, "r_x3": 395.748, "r_y3": 303.346, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.563, "r_y0": 322.9, "r_x1": 463.716, "r_y1": 322.618, "r_x2": 463.716, "r_y2": 314.233, "r_x3": 407.563, "r_y3": 314.515, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.511, "r_y0": 300.579, "r_x1": 463.773, "r_y1": 300.093, "r_x2": 463.773, "r_y2": 291.708, "r_x3": 418.511, "r_y3": 292.194, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.397, "r_y0": 333.784, "r_x1": 463.915, "r_y1": 333.963, "r_x2": 463.915, "r_y2": 325.578, "r_x3": 407.397, "r_y3": 325.399, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.895, "r_y0": 288.651, "r_x1": 463.513, "r_y1": 288.651, "r_x2": 463.513, "r_y2": 280.266, "r_x3": 451.895, "r_y3": 280.266, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.097, "r_y0": 322.989, "r_x1": 402.659, "r_y1": 322.989, "r_x2": 402.659, "r_y2": 314.604, "r_x3": 396.097, "r_y3": 314.604, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.998, "r_y0": 333.883, "r_x1": 402.561, "r_y1": 333.883, "r_x2": 402.561, "r_y2": 325.498, "r_x3": 395.998, "r_y3": 325.498, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.275, "r_y0": 300.765, "r_x1": 414.036, "r_y1": 300.628, "r_x2": 414.036, "r_y2": 292.243, "r_x3": 396.275, "r_y3": 292.38, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.256, "r_y0": 419.675, "r_x1": 452.874, "r_y1": 419.675, "r_x2": 452.874, "r_y2": 411.29, "r_x3": 441.256, "r_y3": 411.29, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 406.873, "r_x1": 432.489, "r_y1": 406.873, "r_x2": 432.489, "r_y2": 399.886, "r_x3": 393.753, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.59, "r_y0": 406.873, "r_x1": 438.801, "r_y1": 406.873, "r_x2": 438.801, "r_y2": 399.886, "r_x3": 434.59, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.906, "r_y0": 406.873, "r_x1": 463.222, "r_y1": 406.873, "r_x2": 463.222, "r_y2": 399.886, "r_x3": 440.906, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.118, "r_y0": 265.626, "r_x1": 413.993, "r_y1": 265.626, "r_x2": 413.993, "r_y2": 258.63800000000003, "r_x3": 384.118, "r_y3": 258.63800000000003, "coord_origin": "TOPLEFT"}, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 273.75300000000004, "r_x1": 451.451, "r_y1": 273.75300000000004, "r_x2": 451.451, "r_y2": 266.76599999999996, "r_x3": 393.753, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.551, "r_y0": 273.75300000000004, "r_x1": 461.975, "r_y1": 273.75300000000004, "r_x2": 461.975, "r_y2": 266.76599999999996, "r_x3": 453.551, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.793, "r_y0": 406.839, "r_x1": 233.894, "r_y1": 406.839, "r_x2": 233.894, "r_y2": 399.851, "r_x3": 151.793, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.993, "r_y0": 406.839, "r_x1": 244.417, "r_y1": 406.839, "r_x2": 244.417, "r_y2": 399.851, "r_x3": 235.993, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.522, "r_y0": 406.839, "r_x1": 268.839, "r_y1": 406.839, "r_x2": 268.839, "r_y2": 399.851, "r_x3": 246.522, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.33, "r_y0": 220.65300000000002, "r_x1": 159.798, "r_y1": 220.65300000000002, "r_x2": 159.798, "r_y2": 213.66600000000005, "r_x3": 154.33, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.071, "r_y0": 220.65300000000002, "r_x1": 326.539, "r_y1": 220.65300000000002, "r_x2": 326.539, "r_y2": 213.66600000000005, "r_x3": 321.071, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 286.675, "r_x1": 175.839, "r_y1": 286.675, "r_x2": 175.839, "r_y2": 280.386, "r_x3": 153.095, "r_y3": 280.386, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 293.491, "r_x1": 172.796, "r_y1": 293.491, "r_x2": 172.796, "r_y2": 287.203, "r_x3": 160.67, "r_y3": 287.203, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 300.308, "r_x1": 351.469, "r_y1": 300.308, "r_x2": 351.469, "r_y2": 294.019, "r_x3": 168.246, "r_y3": 294.019, "coord_origin": "TOPLEFT"}, "text": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "orig": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 307.125, "r_x1": 174.69, "r_y1": 307.125, "r_x2": 174.69, "r_y2": 300.836, "r_x3": 160.67, "r_y3": 300.836, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 313.942, "r_x1": 172.796, "r_y1": 313.942, "r_x2": 172.796, "r_y2": 307.653, "r_x3": 160.67, "r_y3": 307.653, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 320.759, "r_x1": 265.275, "r_y1": 320.759, "r_x2": 265.275, "r_y2": 314.47, "r_x3": 168.246, "r_y3": 314.47, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 327.575, "r_x1": 174.69, "r_y1": 327.575, "r_x2": 174.69, "r_y2": 321.287, "r_x3": 160.67, "r_y3": 321.287, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 334.392, "r_x1": 172.796, "r_y1": 334.392, "r_x2": 172.796, "r_y2": 328.103, "r_x3": 160.67, "r_y3": 328.103, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 341.209, "r_x1": 373.091, "r_y1": 341.209, "r_x2": 373.091, "r_y2": 334.92, "r_x3": 168.246, "r_y3": 334.92, "coord_origin": "TOPLEFT"}, "text": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 348.026, "r_x1": 174.69, "r_y1": 348.026, "r_x2": 174.69, "r_y2": 341.737, "r_x3": 160.67, "r_y3": 341.737, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 354.842, "r_x1": 172.796, "r_y1": 354.842, "r_x2": 172.796, "r_y2": 348.553, "r_x3": 160.67, "r_y3": 348.553, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 361.659, "r_x1": 298.249, "r_y1": 361.659, "r_x2": 298.249, "r_y2": 355.37, "r_x3": 168.246, "r_y3": 355.37, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 368.476, "r_x1": 174.69, "r_y1": 368.476, "r_x2": 174.69, "r_y2": 362.187, "r_x3": 160.67, "r_y3": 362.187, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 375.292, "r_x1": 172.796, "r_y1": 375.292, "r_x2": 172.796, "r_y2": 369.004, "r_x3": 160.67, "r_y3": 369.004, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 382.109, "r_x1": 298.249, "r_y1": 382.109, "r_x2": 298.249, "r_y2": 375.821, "r_x3": 168.246, "r_y3": 375.821, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 388.926, "r_x1": 174.69, "r_y1": 388.926, "r_x2": 174.69, "r_y2": 382.637, "r_x3": 160.67, "r_y3": 382.637, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 395.743, "r_x1": 177.733, "r_y1": 395.743, "r_x2": 177.733, "r_y2": 389.454, "r_x3": 153.095, "r_y3": 389.454, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.061, "r_y0": 419.828, "r_x1": 412.476, "r_y1": 419.828, "r_x2": 412.476, "r_y2": 411.443, "r_x3": 395.061, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.693, "r_y0": 419.828, "r_x1": 436.571, "r_y1": 419.828, "r_x2": 436.571, "r_y2": 411.443, "r_x3": 418.693, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 416.144, "r_x1": 175.106, "r_y1": 416.144, "r_x2": 175.106, "r_y2": 409.855, "r_x3": 152.362, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.894, "r_y0": 416.144, "r_x1": 191.019, "r_y1": 416.144, "r_x2": 191.019, "r_y2": 409.855, "r_x3": 178.894, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.807, "r_y0": 416.144, "r_x1": 208.826, "r_y1": 416.144, "r_x2": 208.826, "r_y2": 409.855, "r_x3": 194.807, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.614, "r_y0": 416.144, "r_x1": 226.26, "r_y1": 416.144, "r_x2": 226.26, "r_y2": 409.855, "r_x3": 212.614, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.047, "r_y0": 416.144, "r_x1": 245.588, "r_y1": 416.144, "r_x2": 245.588, "r_y2": 409.855, "r_x3": 230.047, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.375, "r_y0": 416.144, "r_x1": 259.039, "r_y1": 416.144, "r_x2": 259.039, "r_y2": 409.855, "r_x3": 249.375, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td", "orig": "<td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.828, "r_y0": 416.144, "r_x1": 298.936, "r_y1": 416.144, "r_x2": 298.936, "r_y2": 409.855, "r_x3": 262.828, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"2\"", "orig": "colspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.724, "r_y0": 416.144, "r_x1": 338.832, "r_y1": 416.144, "r_x2": 338.832, "r_y2": 409.855, "r_x3": 302.724, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"3\"", "orig": "colspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 424.476, "r_x1": 190.741, "r_y1": 424.476, "r_x2": 190.741, "r_y2": 418.187, "r_x3": 152.362, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"2\"", "orig": "rowspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.529, "r_y0": 424.476, "r_x1": 232.908, "r_y1": 424.476, "r_x2": 232.908, "r_y2": 418.187, "r_x3": 194.529, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"3\"", "orig": "rowspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.695, "r_y0": 424.476, "r_x1": 269.101, "r_y1": 424.476, "r_x2": 269.101, "r_y2": 418.187, "r_x3": 236.695, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "> </table>", "orig": "> </table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.506, "r_y0": 265.679, "r_x1": 185.219, "r_y1": 265.679, "r_x2": 185.219, "r_y2": 258.692, "r_x3": 154.506, "r_y3": 258.692, "coord_origin": "TOPLEFT"}, "text": "C HTML", "orig": "C HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.355, "r_y0": 273.57500000000005, "r_x1": 222.054, "r_y1": 273.57500000000005, "r_x2": 222.054, "r_y2": 266.58799999999997, "r_x3": 164.355, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.153, "r_y0": 273.57500000000005, "r_x1": 232.577, "r_y1": 273.57500000000005, "r_x2": 232.577, "r_y2": 266.58799999999997, "r_x3": 224.153, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 396.411, "t": 280.49, "r": 446.134, "b": 289.478, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.411, "r_y0": 289.478, "r_x1": 446.134, "r_y1": 288.875, "r_x2": 446.134, "r_y2": 280.49, "r_x3": 396.411, "r_y3": 281.093, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 395.748, "t": 302.952, "r": 463.795, "b": 311.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.748, "r_y0": 311.731, "r_x1": 463.795, "r_y1": 311.337, "r_x2": 463.795, "r_y2": 302.952, "r_x3": 395.748, "r_y3": 303.346, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 407.563, "t": 314.233, "r": 463.716, "b": 322.9, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.563, "r_y0": 322.9, "r_x1": 463.716, "r_y1": 322.618, "r_x2": 463.716, "r_y2": 314.233, "r_x3": 407.563, "r_y3": 314.515, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 418.511, "t": 291.708, "r": 463.773, "b": 300.579, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.511, "r_y0": 300.579, "r_x1": 463.773, "r_y1": 300.093, "r_x2": 463.773, "r_y2": 291.708, "r_x3": 418.511, "r_y3": 292.194, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 407.397, "t": 325.399, "r": 463.915, "b": 333.963, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.397, "r_y0": 333.784, "r_x1": 463.915, "r_y1": 333.963, "r_x2": 463.915, "r_y2": 325.578, "r_x3": 407.397, "r_y3": 325.399, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 451.895, "t": 280.266, "r": 463.513, "b": 288.651, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.895, "r_y0": 288.651, "r_x1": 463.513, "r_y1": 288.651, "r_x2": 463.513, "r_y2": 280.266, "r_x3": 451.895, "r_y3": 280.266, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 396.097, "t": 314.604, "r": 402.659, "b": 322.989, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.097, "r_y0": 322.989, "r_x1": 402.659, "r_y1": 322.989, "r_x2": 402.659, "r_y2": 314.604, "r_x3": 396.097, "r_y3": 314.604, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 395.998, "t": 325.498, "r": 402.561, "b": 333.883, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.998, "r_y0": 333.883, "r_x1": 402.561, "r_y1": 333.883, "r_x2": 402.561, "r_y2": 325.498, "r_x3": 395.998, "r_y3": 325.498, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 396.275, "t": 292.243, "r": 414.036, "b": 300.765, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.275, "r_y0": 300.765, "r_x1": 414.036, "r_y1": 300.628, "r_x2": 414.036, "r_y2": 292.243, "r_x3": 396.275, "r_y3": 292.38, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 441.256, "t": 411.29, "r": 452.874, "b": 419.675, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.256, "r_y0": 419.675, "r_x1": 452.874, "r_y1": 419.675, "r_x2": 452.874, "r_y2": 411.29, "r_x3": 441.256, "r_y3": 411.29, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 393.753, "t": 399.886, "r": 432.489, "b": 406.873, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 406.873, "r_x1": 432.489, "r_y1": 406.873, "r_x2": 432.489, "r_y2": 399.886, "r_x3": 393.753, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 434.59, "t": 399.886, "r": 438.801, "b": 406.873, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.59, "r_y0": 406.873, "r_x1": 438.801, "r_y1": 406.873, "r_x2": 438.801, "r_y2": 399.886, "r_x3": 434.59, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 440.906, "t": 399.886, "r": 463.222, "b": 406.873, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.906, "r_y0": 406.873, "r_x1": 463.222, "r_y1": 406.873, "r_x2": 463.222, "r_y2": 399.886, "r_x3": 440.906, "r_y3": 399.886, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 384.118, "t": 258.63800000000003, "r": 413.993, "b": 265.626, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.118, "r_y0": 265.626, "r_x1": 413.993, "r_y1": 265.626, "r_x2": 413.993, "r_y2": 258.63800000000003, "r_x3": 384.118, "r_y3": 258.63800000000003, "coord_origin": "TOPLEFT"}, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 393.753, "t": 266.76599999999996, "r": 451.451, "b": 273.75300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.753, "r_y0": 273.75300000000004, "r_x1": 451.451, "r_y1": 273.75300000000004, "r_x2": 451.451, "r_y2": 266.76599999999996, "r_x3": 393.753, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 453.551, "t": 266.76599999999996, "r": 461.975, "b": 273.75300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.551, "r_y0": 273.75300000000004, "r_x1": 461.975, "r_y1": 273.75300000000004, "r_x2": 461.975, "r_y2": 266.76599999999996, "r_x3": 453.551, "r_y3": 266.76599999999996, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 151.793, "t": 399.851, "r": 233.894, "b": 406.839, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.793, "r_y0": 406.839, "r_x1": 233.894, "r_y1": 406.839, "r_x2": 233.894, "r_y2": 399.851, "r_x3": 151.793, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 235.993, "t": 399.851, "r": 244.417, "b": 406.839, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.993, "r_y0": 406.839, "r_x1": 244.417, "r_y1": 406.839, "r_x2": 244.417, "r_y2": 399.851, "r_x3": 235.993, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 246.522, "t": 399.851, "r": 268.839, "b": 406.839, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.522, "r_y0": 406.839, "r_x1": 268.839, "r_y1": 406.839, "r_x2": 268.839, "r_y2": 399.851, "r_x3": 246.522, "r_y3": 399.851, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 154.33, "t": 213.66600000000005, "r": 159.798, "b": 220.65300000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.33, "r_y0": 220.65300000000002, "r_x1": 159.798, "r_y1": 220.65300000000002, "r_x2": 159.798, "r_y2": 213.66600000000005, "r_x3": 154.33, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 321.071, "t": 213.66600000000005, "r": 326.539, "b": 220.65300000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.071, "r_y0": 220.65300000000002, "r_x1": 326.539, "r_y1": 220.65300000000002, "r_x2": 326.539, "r_y2": 213.66600000000005, "r_x3": 321.071, "r_y3": 213.66600000000005, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 153.095, "t": 280.386, "r": 175.839, "b": 286.675, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 286.675, "r_x1": 175.839, "r_y1": 286.675, "r_x2": 175.839, "r_y2": 280.386, "r_x3": 153.095, "r_y3": 280.386, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 160.67, "t": 287.203, "r": 172.796, "b": 293.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 293.491, "r_x1": 172.796, "r_y1": 293.491, "r_x2": 172.796, "r_y2": 287.203, "r_x3": 160.67, "r_y3": 287.203, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 168.246, "t": 294.019, "r": 351.469, "b": 300.308, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 300.308, "r_x1": 351.469, "r_y1": 300.308, "r_x2": 351.469, "r_y2": 294.019, "r_x3": 168.246, "r_y3": 294.019, "coord_origin": "TOPLEFT"}, "text": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "orig": "<td colspan='2' rowspan='2' > </td> <td colspan='3' > </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 160.67, "t": 300.836, "r": 174.69, "b": 307.125, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 307.125, "r_x1": 174.69, "r_y1": 307.125, "r_x2": 174.69, "r_y2": 300.836, "r_x3": 160.67, "r_y3": 300.836, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 160.67, "t": 307.653, "r": 172.796, "b": 313.942, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 313.942, "r_x1": 172.796, "r_y1": 313.942, "r_x2": 172.796, "r_y2": 307.653, "r_x3": 160.67, "r_y3": 307.653, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 168.246, "t": 314.47, "r": 265.275, "b": 320.759, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 320.759, "r_x1": 265.275, "r_y1": 320.759, "r_x2": 265.275, "r_y2": 314.47, "r_x3": 168.246, "r_y3": 314.47, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 160.67, "t": 321.287, "r": 174.69, "b": 327.575, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 327.575, "r_x1": 174.69, "r_y1": 327.575, "r_x2": 174.69, "r_y2": 321.287, "r_x3": 160.67, "r_y3": 321.287, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 160.67, "t": 328.103, "r": 172.796, "b": 334.392, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 334.392, "r_x1": 172.796, "r_y1": 334.392, "r_x2": 172.796, "r_y2": 328.103, "r_x3": 160.67, "r_y3": 328.103, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 168.246, "t": 334.92, "r": 373.091, "b": 341.209, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 341.209, "r_x1": 373.091, "r_y1": 341.209, "r_x2": 373.091, "r_y2": 334.92, "r_x3": 168.246, "r_y3": 334.92, "coord_origin": "TOPLEFT"}, "text": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td rowspan='3' > </td> <td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 160.67, "t": 341.737, "r": 174.69, "b": 348.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 348.026, "r_x1": 174.69, "r_y1": 348.026, "r_x2": 174.69, "r_y2": 341.737, "r_x3": 160.67, "r_y3": 341.737, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 160.67, "t": 348.553, "r": 172.796, "b": 354.842, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 354.842, "r_x1": 172.796, "r_y1": 354.842, "r_x2": 172.796, "r_y2": 348.553, "r_x3": 160.67, "r_y3": 348.553, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 168.246, "t": 355.37, "r": 298.249, "b": 361.659, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 361.659, "r_x1": 298.249, "r_y1": 361.659, "r_x2": 298.249, "r_y2": 355.37, "r_x3": 168.246, "r_y3": 355.37, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 160.67, "t": 362.187, "r": 174.69, "b": 368.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 368.476, "r_x1": 174.69, "r_y1": 368.476, "r_x2": 174.69, "r_y2": 362.187, "r_x3": 160.67, "r_y3": 362.187, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 160.67, "t": 369.004, "r": 172.796, "b": 375.292, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 375.292, "r_x1": 172.796, "r_y1": 375.292, "r_x2": 172.796, "r_y2": 369.004, "r_x3": 160.67, "r_y3": 369.004, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 168.246, "t": 375.821, "r": 298.249, "b": 382.109, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.246, "r_y0": 382.109, "r_x1": 298.249, "r_y1": 382.109, "r_x2": 298.249, "r_y2": 375.821, "r_x3": 168.246, "r_y3": 375.821, "coord_origin": "TOPLEFT"}, "text": "<td> </td> <td> </td> <td> </td> <td> </td>", "orig": "<td> </td> <td> </td> <td> </td> <td> </td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 160.67, "t": 382.637, "r": 174.69, "b": 388.926, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.67, "r_y0": 388.926, "r_x1": 174.69, "r_y1": 388.926, "r_x2": 174.69, "r_y2": 382.637, "r_x3": 160.67, "r_y3": 382.637, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 153.095, "t": 389.454, "r": 177.733, "b": 395.743, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.095, "r_y0": 395.743, "r_x1": 177.733, "r_y1": 395.743, "r_x2": 177.733, "r_y2": 389.454, "r_x3": 153.095, "r_y3": 389.454, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 395.061, "t": 411.443, "r": 412.476, "b": 419.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.061, "r_y0": 419.828, "r_x1": 412.476, "r_y1": 419.828, "r_x2": 412.476, "r_y2": 411.443, "r_x3": 395.061, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 418.693, "t": 411.443, "r": 436.571, "b": 419.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.693, "r_y0": 419.828, "r_x1": 436.571, "r_y1": 419.828, "r_x2": 436.571, "r_y2": 411.443, "r_x3": 418.693, "r_y3": 411.443, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 152.362, "t": 409.855, "r": 175.106, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 416.144, "r_x1": 175.106, "r_y1": 416.144, "r_x2": 175.106, "r_y2": 409.855, "r_x3": 152.362, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 178.894, "t": 409.855, "r": 191.019, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.894, "r_y0": 416.144, "r_x1": 191.019, "r_y1": 416.144, "r_x2": 191.019, "r_y2": 409.855, "r_x3": 178.894, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 194.807, "t": 409.855, "r": 208.826, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.807, "r_y0": 416.144, "r_x1": 208.826, "r_y1": 416.144, "r_x2": 208.826, "r_y2": 409.855, "r_x3": 194.807, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 212.614, "t": 409.855, "r": 226.26, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.614, "r_y0": 416.144, "r_x1": 226.26, "r_y1": 416.144, "r_x2": 226.26, "r_y2": 409.855, "r_x3": 212.614, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 230.047, "t": 409.855, "r": 245.588, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.047, "r_y0": 416.144, "r_x1": 245.588, "r_y1": 416.144, "r_x2": 245.588, "r_y2": 409.855, "r_x3": 230.047, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 249.375, "t": 409.855, "r": 259.039, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.375, "r_y0": 416.144, "r_x1": 259.039, "r_y1": 416.144, "r_x2": 259.039, "r_y2": 409.855, "r_x3": 249.375, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "<td", "orig": "<td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 262.828, "t": 409.855, "r": 298.936, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.828, "r_y0": 416.144, "r_x1": 298.936, "r_y1": 416.144, "r_x2": 298.936, "r_y2": 409.855, "r_x3": 262.828, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"2\"", "orig": "colspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 302.724, "t": 409.855, "r": 338.832, "b": 416.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.724, "r_y0": 416.144, "r_x1": 338.832, "r_y1": 416.144, "r_x2": 338.832, "r_y2": 409.855, "r_x3": 302.724, "r_y3": 409.855, "coord_origin": "TOPLEFT"}, "text": "colspan=\"3\"", "orig": "colspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 152.362, "t": 418.187, "r": 190.741, "b": 424.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.362, "r_y0": 424.476, "r_x1": 190.741, "r_y1": 424.476, "r_x2": 190.741, "r_y2": 418.187, "r_x3": 152.362, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"2\"", "orig": "rowspan=\"2\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 194.529, "t": 418.187, "r": 232.908, "b": 424.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.529, "r_y0": 424.476, "r_x1": 232.908, "r_y1": 424.476, "r_x2": 232.908, "r_y2": 418.187, "r_x3": 194.529, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "rowspan=\"3\"", "orig": "rowspan=\"3\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 236.695, "t": 418.187, "r": 269.101, "b": 424.476, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.695, "r_y0": 424.476, "r_x1": 269.101, "r_y1": 424.476, "r_x2": 269.101, "r_y2": 418.187, "r_x3": 236.695, "r_y3": 418.187, "coord_origin": "TOPLEFT"}, "text": "> </table>", "orig": "> </table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 154.506, "t": 258.692, "r": 185.219, "b": 265.679, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.506, "r_y0": 265.679, "r_x1": 185.219, "r_y1": 265.679, "r_x2": 185.219, "r_y2": 258.692, "r_x3": 154.506, "r_y3": 258.692, "coord_origin": "TOPLEFT"}, "text": "C HTML", "orig": "C HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 164.355, "t": 266.58799999999997, "r": 222.054, "b": 273.57500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.355, "r_y0": 273.57500000000005, "r_x1": 222.054, "r_y1": 273.57500000000005, "r_x2": 222.054, "r_y2": 266.58799999999997, "r_x3": 164.355, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 224.153, "t": 266.58799999999997, "r": 232.577, "b": 273.57500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.153, "r_y0": 273.57500000000005, "r_x1": 232.577, "r_y1": 273.57500000000005, "r_x2": 232.577, "r_y2": 266.58799999999997, "r_x3": 224.153, "r_y3": 266.58799999999997, "coord_origin": "TOPLEFT"}, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "text", "id": 2, "page_no": 1, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 452.314, "r": 480.592, "b": 520.887, "coord_origin": "TOPLEFT"}, "confidence": 0.950499951839447, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 461.111, "r_x1": 161.329, "r_y1": 461.111, "r_x2": 161.329, "r_y2": 452.314, "r_x3": 134.765, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.269, "r_y0": 461.111, "r_x1": 226.286, "r_y1": 461.111, "r_x2": 226.286, "r_y2": 452.314, "r_x3": 164.269, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.992, "r_y0": 461.111, "r_x1": 480.592, "r_y1": 461.111, "r_x2": 480.592, "r_y2": 452.314, "r_x3": 229.992, "r_y3": 452.314, "coord_origin": "TOPLEFT"}, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 473.066, "r_x1": 480.592, "r_y1": 473.066, "r_x2": 480.592, "r_y2": 464.269, "r_x3": 134.765, "r_y3": 464.269, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 485.021, "r_x1": 480.587, "r_y1": 485.021, "r_x2": 480.587, "r_y2": 476.224, "r_x3": 134.765, "r_y3": 476.224, "coord_origin": "TOPLEFT"}, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 496.977, "r_x1": 480.587, "r_y1": 496.977, "r_x2": 480.587, "r_y2": 488.18, "r_x3": 134.765, "r_y3": 488.18, "coord_origin": "TOPLEFT"}, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 508.932, "r_x1": 165.481, "r_y1": 508.932, "r_x2": 165.481, "r_y2": 500.135, "r_x3": 134.765, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "area of", "orig": "area of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.874, "r_y0": 508.932, "r_x1": 207.895, "r_y1": 508.932, "r_x2": 207.895, "r_y2": 500.135, "r_x3": 169.874, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "research,", "orig": "research,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.289, "r_y0": 508.932, "r_x1": 220.589, "r_y1": 508.932, "r_x2": 220.589, "r_y2": 500.135, "r_x3": 212.289, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.992, "r_y0": 508.932, "r_x1": 480.59, "r_y1": 508.932, "r_x2": 480.59, "r_y2": 500.135, "r_x3": 224.992, "r_y3": 500.135, "coord_origin": "TOPLEFT"}, "text": "which many novel machine learning algorithms are being", "orig": "which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 520.887, "r_x1": 313.246, "r_y1": 520.887, "r_x2": 313.246, "r_y2": 512.0899999999999, "r_x3": 134.765, "r_y3": 512.0899999999999, "coord_origin": "TOPLEFT"}, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "today, table detection in documents is a well understood problem, and the latest state-of-the-art (SOTA) object detection methods provide an accuracy comparable to human observers [7,8,10,14,23]. On the other hand, the problem of table structure recognition (TSR) is a lot more challenging and remains a very active area of research, in which many novel machine learning algorithms are being explored [3,4,5,9,11,12,13,14,17,18,21,22]."}, {"label": "text", "id": 0, "page_no": 1, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 524.5509999999999, "r": 480.595, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9845512509346008, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 533.348, "r_x1": 187.471, "r_y1": 533.348, "r_x2": 187.471, "r_y2": 524.5509999999999, "r_x3": 149.709, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "Recently", "orig": "Recently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.194, "r_y0": 533.348, "r_x1": 480.589, "r_y1": 533.348, "r_x2": 480.589, "r_y2": 524.5509999999999, "r_x3": 192.194, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "emerging SOTA methods for table structure recognition employ", "orig": "emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 480.592, "r_y1": 545.304, "r_x2": 480.592, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.589, "r_y1": 557.259, "r_x2": 480.589, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 480.588, "r_y1": 569.2139999999999, "r_x2": 480.588, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 480.59, "r_y1": 581.169, "r_x2": 480.59, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.595, "r_y1": 593.124, "r_x2": 480.595, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.587, "r_y1": 605.08, "r_x2": 480.587, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.595, "r_y1": 617.035, "r_x2": 480.595, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.594, "r_y1": 628.99, "r_x2": 480.594, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.595, "r_y1": 640.9449999999999, "r_x2": 480.595, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.588, "r_y1": 652.9, "r_x2": 480.588, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 421.454, "r_y1": 664.855, "r_x2": 421.454, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Recently emerging SOTA methods for table structure recognition employ transformer-based models, in which an image of the table is provided to the network in order to predict the structure of the table as a sequence of tokens. These image-to-sequence (Im2Seq) models are extremely powerful, since they allow for a purely data-driven solution. The tokens of the sequence typically belong to a markup language such as HTML, Latex or Markdown, which allow to describe table structure as rows, columns and spanning cells in various configurations. In Figure 1, we illustrate how HTML is used to represent the table-structure of a particular example table. Public table-structure data sets such as PubTabNet [22], and FinTabNet [21], which were created in a semi-automated way from paired PDF and HTML sources (e.g. PubMed Central), popularized primarily the use of HTML as ground-truth representation format for TSR."}], "headers": [{"label": "page_header", "id": 5, "page_no": 1, "cluster": {"id": 5, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8580349683761597, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2"}, {"label": "page_header", "id": 3, "page_no": 1, "cluster": {"id": 3, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9076642990112305, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}]}}, {"page_no": 2, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 127.731, "r_x1": 480.592, "r_y1": 127.731, "r_x2": 480.592, "r_y2": 118.93399999999997, "r_x3": 149.709, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.587, "r_y1": 139.68600000000004, "r_x2": 480.587, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.592, "r_y1": 151.64200000000005, "r_x2": 480.592, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 169.625, "r_y1": 163.59699999999998, "r_x2": 169.625, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 173.861, "r_y0": 163.59699999999998, "r_x1": 194.555, "r_y1": 163.59699999999998, "r_x2": 194.555, "r_y2": 154.79999999999995, "r_x3": 173.861, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.61, "r_y0": 163.59699999999998, "r_x1": 211.535, "r_y1": 163.59699999999998, "r_x2": 211.535, "r_y2": 154.79999999999995, "r_x3": 199.61, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.769, "r_y0": 163.59699999999998, "r_x1": 480.586, "r_y1": 163.59699999999998, "r_x2": 480.586, "r_y2": 154.79999999999995, "r_x3": 215.769, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "the sequence tokenization in Im2Seq models. In this paper,", "orig": "the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.592, "r_y1": 175.55200000000002, "r_x2": 480.592, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 480.59, "r_y1": 187.50699999999995, "r_x2": 480.59, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 199.462, "r_x1": 480.592, "r_y1": 199.462, "r_x2": 480.592, "r_y2": 190.66499999999996, "r_x3": 134.765, "r_y3": 190.66499999999996, "coord_origin": "TOPLEFT"}, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 211.41700000000003, "r_x1": 348.355, "r_y1": 211.41700000000003, "r_x2": 348.355, "r_y2": 202.62, "r_x3": 134.765, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 223.63300000000004, "r_x1": 480.594, "r_y1": 223.63300000000004, "r_x2": 480.594, "r_y2": 214.836, "r_x3": 149.709, "r_y3": 214.836, "coord_origin": "TOPLEFT"}, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.58799999999997, "r_x1": 480.594, "r_y1": 235.58799999999997, "r_x2": 480.594, "r_y2": 226.79100000000005, "r_x3": 134.765, "r_y3": 226.79100000000005, "coord_origin": "TOPLEFT"}, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.54399999999998, "r_x1": 480.587, "r_y1": 247.54399999999998, "r_x2": 480.587, "r_y2": 238.74699999999996, "r_x3": 134.765, "r_y3": 238.74699999999996, "coord_origin": "TOPLEFT"}, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.499, "r_x1": 480.587, "r_y1": 259.499, "r_x2": 480.587, "r_y2": 250.702, "r_x3": 134.765, "r_y3": 250.702, "coord_origin": "TOPLEFT"}, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 271.45399999999995, "r_x1": 480.588, "r_y1": 271.45399999999995, "r_x2": 480.588, "r_y2": 262.65700000000004, "r_x3": 134.765, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.409, "r_x1": 480.596, "r_y1": 283.409, "r_x2": 480.596, "r_y2": 274.61199999999997, "r_x3": 134.765, "r_y3": 274.61199999999997, "coord_origin": "TOPLEFT"}, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.364, "r_x1": 480.593, "r_y1": 295.364, "r_x2": 480.593, "r_y2": 286.567, "r_x3": 134.765, "r_y3": 286.567, "coord_origin": "TOPLEFT"}, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 307.319, "r_x1": 480.595, "r_y1": 307.319, "r_x2": 480.595, "r_y2": 298.522, "r_x3": 134.765, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 319.275, "r_x1": 480.587, "r_y1": 319.275, "r_x2": 480.587, "r_y2": 310.478, "r_x3": 134.765, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.23, "r_x1": 179.72, "r_y1": 331.23, "r_x2": 179.72, "r_y2": 322.433, "r_x3": 134.765, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 343.445, "r_x1": 480.588, "r_y1": 343.445, "r_x2": 480.588, "r_y2": 334.648, "r_x3": 149.709, "r_y3": 334.648, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 355.401, "r_x1": 158.613, "r_y1": 355.401, "r_x2": 158.613, "r_y2": 346.604, "r_x3": 134.765, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "latest", "orig": "latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.366, "r_y0": 355.401, "r_x1": 303.894, "r_y1": 355.401, "r_x2": 303.894, "r_y2": 346.604, "r_x3": 163.366, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "developments in table-structure", "orig": "developments in table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.636, "r_y0": 355.401, "r_x1": 373.487, "r_y1": 355.401, "r_x2": 373.487, "r_y2": 346.604, "r_x3": 308.636, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "reconstruction.", "orig": "reconstruction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.239, "r_y0": 355.401, "r_x1": 387.369, "r_y1": 355.401, "r_x2": 387.369, "r_y2": 346.604, "r_x3": 378.239, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.111, "r_y0": 355.401, "r_x1": 422.055, "r_y1": 355.401, "r_x2": 422.055, "r_y2": 346.604, "r_x3": 392.111, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "section", "orig": "section", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.798, "r_y0": 355.401, "r_x1": 480.594, "r_y1": 355.401, "r_x2": 480.594, "r_y2": 346.604, "r_x3": 426.798, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "3 we review", "orig": "3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 367.356, "r_x1": 480.587, "r_y1": 367.356, "r_x2": 480.587, "r_y2": 358.559, "r_x3": 134.765, "r_y3": 358.559, "coord_origin": "TOPLEFT"}, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.311, "r_x1": 480.592, "r_y1": 379.311, "r_x2": 480.592, "r_y2": 370.514, "r_x3": 134.765, "r_y3": 370.514, "coord_origin": "TOPLEFT"}, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.266, "r_x1": 480.592, "r_y1": 391.266, "r_x2": 480.592, "r_y2": 382.469, "r_x3": 134.765, "r_y3": 382.469, "coord_origin": "TOPLEFT"}, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 403.221, "r_x1": 480.588, "r_y1": 403.221, "r_x2": 480.588, "r_y2": 394.424, "r_x3": 134.765, "r_y3": 394.424, "coord_origin": "TOPLEFT"}, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 415.177, "r_x1": 480.595, "r_y1": 415.177, "r_x2": 480.595, "r_y2": 406.38, "r_x3": 134.765, "r_y3": 406.38, "coord_origin": "TOPLEFT"}, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 427.132, "r_x1": 142.789, "r_y1": 427.132, "r_x2": 142.789, "r_y2": 418.335, "r_x3": 134.765, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.431, "r_y0": 427.132, "r_x1": 170.173, "r_y1": 427.132, "r_x2": 170.173, "r_y2": 418.335, "r_x3": 147.431, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "using", "orig": "using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.826, "r_y0": 427.132, "r_x1": 288.974, "r_y1": 427.132, "r_x2": 288.974, "r_y2": 418.335, "r_x3": 174.826, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "OTSL. Finally, in section", "orig": "OTSL. Finally, in section", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.627, "r_y0": 427.132, "r_x1": 480.596, "r_y1": 427.132, "r_x2": 480.596, "r_y2": 418.335, "r_x3": 293.627, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "6 we conclude our work and outline next", "orig": "6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.087, "r_x1": 201.272, "r_y1": 439.087, "r_x2": 201.272, "r_y2": 430.29, "r_x3": 134.765, "r_y3": 430.29, "coord_origin": "TOPLEFT"}, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 472.656, "r_x1": 141.489, "r_y1": 472.656, "r_x2": 141.489, "r_y2": 462.088, "r_x3": 134.765, "r_y3": 462.088, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 472.656, "r_x1": 236.769, "r_y1": 472.656, "r_x2": 236.769, "r_y2": 462.088, "r_x3": 154.938, "r_y3": 462.088, "coord_origin": "TOPLEFT"}, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 497.483, "r_x1": 480.591, "r_y1": 497.483, "r_x2": 480.591, "r_y2": 488.686, "r_x3": 134.765, "r_y3": 488.686, "coord_origin": "TOPLEFT"}, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 509.438, "r_x1": 480.592, "r_y1": 509.438, "r_x2": 480.592, "r_y2": 500.641, "r_x3": 134.765, "r_y3": 500.641, "coord_origin": "TOPLEFT"}, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 521.393, "r_x1": 164.401, "r_y1": 521.393, "r_x2": 164.401, "r_y2": 512.596, "r_x3": 134.765, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "variety", "orig": "variety", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.581, "r_y0": 521.393, "r_x1": 177.605, "r_y1": 521.393, "r_x2": 177.605, "r_y2": 512.596, "r_x3": 169.581, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.786, "r_y0": 521.393, "r_x1": 223.77, "r_y1": 521.393, "r_x2": 223.77, "r_y2": 512.596, "r_x3": 182.786, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "computer", "orig": "computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.95, "r_y0": 521.393, "r_x1": 254.183, "r_y1": 521.393, "r_x2": 254.183, "r_y2": 512.596, "r_x3": 228.95, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "vision", "orig": "vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.363, "r_y0": 521.393, "r_x1": 321.047, "r_y1": 521.393, "r_x2": 321.047, "r_y2": 512.596, "r_x3": 259.363, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "methods have", "orig": "methods have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.237, "r_y0": 521.393, "r_x1": 346.435, "r_y1": 521.393, "r_x2": 346.435, "r_y2": 512.596, "r_x3": 326.237, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "been", "orig": "been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 351.616, "r_y0": 521.393, "r_x1": 388.441, "r_y1": 521.393, "r_x2": 388.441, "r_y2": 512.596, "r_x3": 351.616, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "explored", "orig": "explored", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.631, "r_y0": 521.393, "r_x1": 402.485, "r_y1": 521.393, "r_x2": 402.485, "r_y2": 512.596, "r_x3": 393.631, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.666, "r_y0": 521.393, "r_x1": 433.117, "r_y1": 521.393, "r_x2": 433.117, "r_y2": 512.596, "r_x3": 407.666, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "tackle", "orig": "tackle", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 438.307, "r_y0": 521.393, "r_x1": 452.141, "r_y1": 521.393, "r_x2": 452.141, "r_y2": 512.596, "r_x3": 438.307, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 457.321, "r_y0": 521.393, "r_x1": 480.59, "r_y1": 521.393, "r_x2": 480.59, "r_y2": 512.596, "r_x3": 457.321, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "prob-", "orig": "prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.3489999999999, "r_x1": 163.373, "r_y1": 533.3489999999999, "r_x2": 163.373, "r_y2": 524.552, "r_x3": 134.765, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "lem of", "orig": "lem of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.463, "r_y0": 533.3489999999999, "r_x1": 190.043, "r_y1": 533.3489999999999, "r_x2": 190.043, "r_y2": 524.552, "r_x3": 168.463, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.134, "r_y0": 533.3489999999999, "r_x1": 234.531, "r_y1": 533.3489999999999, "r_x2": 234.531, "r_y2": 524.552, "r_x3": 195.134, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.632, "r_y0": 533.3489999999999, "r_x1": 290.567, "r_y1": 533.3489999999999, "r_x2": 290.567, "r_y2": 524.552, "r_x3": 239.632, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "recognition,", "orig": "recognition,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.658, "r_y0": 533.3489999999999, "r_x1": 308.384, "r_y1": 533.3489999999999, "r_x2": 308.384, "r_y2": 524.552, "r_x3": 295.658, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.475, "r_y0": 533.3489999999999, "r_x1": 327.308, "r_y1": 533.3489999999999, "r_x2": 327.308, "r_y2": 524.552, "r_x3": 313.475, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.399, "r_y0": 533.3489999999999, "r_x1": 362.335, "r_y1": 533.3489999999999, "r_x2": 362.335, "r_y2": 524.552, "r_x3": 332.399, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "correct", "orig": "correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.426, "r_y0": 533.3489999999999, "r_x1": 424.15, "r_y1": 533.3489999999999, "r_x2": 424.15, "r_y2": 524.552, "r_x3": 367.426, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "identification", "orig": "identification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.241, "r_y0": 533.3489999999999, "r_x1": 437.264, "r_y1": 533.3489999999999, "r_x2": 437.264, "r_y2": 524.552, "r_x3": 429.241, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.355, "r_y0": 533.3489999999999, "r_x1": 480.59, "r_y1": 533.3489999999999, "r_x2": 480.59, "r_y2": 524.552, "r_x3": 442.355, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "columns,", "orig": "columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 480.59, "r_y1": 545.304, "r_x2": 480.59, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.589, "r_y1": 557.259, "r_x2": 480.589, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 152.252, "r_y1": 569.2139999999999, "r_x2": 152.252, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "ods,", "orig": "ods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.433, "r_y0": 569.2139999999999, "r_x1": 257.459, "r_y1": 569.2139999999999, "r_x2": 257.459, "r_y2": 560.417, "r_x3": 157.433, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "Graph-Neural-Network", "orig": "Graph-Neural-Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.65, "r_y0": 569.2139999999999, "r_x1": 480.591, "r_y1": 569.2139999999999, "r_x2": 480.591, "r_y2": 560.417, "r_x3": 262.65, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "(GNN) methods and Image-to-Markup-Sequence", "orig": "(GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 484.121, "r_y1": 581.169, "r_x2": 484.121, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.596, "r_y1": 593.124, "r_x2": 480.596, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.589, "r_y1": 605.08, "r_x2": 480.589, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.591, "r_y1": 617.035, "r_x2": 480.591, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.586, "r_y1": 628.99, "r_x2": 480.586, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.589, "r_y1": 652.9, "r_x2": 480.589, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.856, "r_x1": 480.591, "r_y1": 664.856, "r_x2": 480.591, "r_y2": 656.059, "r_x3": 134.765, "r_y3": 656.059, "coord_origin": "TOPLEFT"}, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 5, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9325801730155945, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8773486614227295, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.592, "b": 211.41700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9871802926063538, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 127.731, "r_x1": 480.592, "r_y1": 127.731, "r_x2": 480.592, "r_y2": 118.93399999999997, "r_x3": 149.709, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.587, "r_y1": 139.68600000000004, "r_x2": 480.587, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.592, "r_y1": 151.64200000000005, "r_x2": 480.592, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 169.625, "r_y1": 163.59699999999998, "r_x2": 169.625, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 173.861, "r_y0": 163.59699999999998, "r_x1": 194.555, "r_y1": 163.59699999999998, "r_x2": 194.555, "r_y2": 154.79999999999995, "r_x3": 173.861, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.61, "r_y0": 163.59699999999998, "r_x1": 211.535, "r_y1": 163.59699999999998, "r_x2": 211.535, "r_y2": 154.79999999999995, "r_x3": 199.61, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.769, "r_y0": 163.59699999999998, "r_x1": 480.586, "r_y1": 163.59699999999998, "r_x2": 480.586, "r_y2": 154.79999999999995, "r_x3": 215.769, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "the sequence tokenization in Im2Seq models. In this paper,", "orig": "the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.592, "r_y1": 175.55200000000002, "r_x2": 480.592, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 480.59, "r_y1": 187.50699999999995, "r_x2": 480.59, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 199.462, "r_x1": 480.592, "r_y1": 199.462, "r_x2": 480.592, "r_y2": 190.66499999999996, "r_x3": 134.765, "r_y3": 190.66499999999996, "coord_origin": "TOPLEFT"}, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 211.41700000000003, "r_x1": 348.355, "r_y1": 211.41700000000003, "r_x2": 348.355, "r_y2": 202.62, "r_x3": 134.765, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 214.836, "r": 480.596, "b": 331.23, "coord_origin": "TOPLEFT"}, "confidence": 0.9871861338615417, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 223.63300000000004, "r_x1": 480.594, "r_y1": 223.63300000000004, "r_x2": 480.594, "r_y2": 214.836, "r_x3": 149.709, "r_y3": 214.836, "coord_origin": "TOPLEFT"}, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.58799999999997, "r_x1": 480.594, "r_y1": 235.58799999999997, "r_x2": 480.594, "r_y2": 226.79100000000005, "r_x3": 134.765, "r_y3": 226.79100000000005, "coord_origin": "TOPLEFT"}, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.54399999999998, "r_x1": 480.587, "r_y1": 247.54399999999998, "r_x2": 480.587, "r_y2": 238.74699999999996, "r_x3": 134.765, "r_y3": 238.74699999999996, "coord_origin": "TOPLEFT"}, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.499, "r_x1": 480.587, "r_y1": 259.499, "r_x2": 480.587, "r_y2": 250.702, "r_x3": 134.765, "r_y3": 250.702, "coord_origin": "TOPLEFT"}, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 271.45399999999995, "r_x1": 480.588, "r_y1": 271.45399999999995, "r_x2": 480.588, "r_y2": 262.65700000000004, "r_x3": 134.765, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.409, "r_x1": 480.596, "r_y1": 283.409, "r_x2": 480.596, "r_y2": 274.61199999999997, "r_x3": 134.765, "r_y3": 274.61199999999997, "coord_origin": "TOPLEFT"}, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.364, "r_x1": 480.593, "r_y1": 295.364, "r_x2": 480.593, "r_y2": 286.567, "r_x3": 134.765, "r_y3": 286.567, "coord_origin": "TOPLEFT"}, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 307.319, "r_x1": 480.595, "r_y1": 307.319, "r_x2": 480.595, "r_y2": 298.522, "r_x3": 134.765, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 319.275, "r_x1": 480.587, "r_y1": 319.275, "r_x2": 480.587, "r_y2": 310.478, "r_x3": 134.765, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.23, "r_x1": 179.72, "r_y1": 331.23, "r_x2": 179.72, "r_y2": 322.433, "r_x3": 134.765, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 334.648, "r": 480.596, "b": 439.087, "coord_origin": "TOPLEFT"}, "confidence": 0.988121747970581, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 343.445, "r_x1": 480.588, "r_y1": 343.445, "r_x2": 480.588, "r_y2": 334.648, "r_x3": 149.709, "r_y3": 334.648, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 355.401, "r_x1": 158.613, "r_y1": 355.401, "r_x2": 158.613, "r_y2": 346.604, "r_x3": 134.765, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "latest", "orig": "latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.366, "r_y0": 355.401, "r_x1": 303.894, "r_y1": 355.401, "r_x2": 303.894, "r_y2": 346.604, "r_x3": 163.366, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "developments in table-structure", "orig": "developments in table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.636, "r_y0": 355.401, "r_x1": 373.487, "r_y1": 355.401, "r_x2": 373.487, "r_y2": 346.604, "r_x3": 308.636, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "reconstruction.", "orig": "reconstruction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.239, "r_y0": 355.401, "r_x1": 387.369, "r_y1": 355.401, "r_x2": 387.369, "r_y2": 346.604, "r_x3": 378.239, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.111, "r_y0": 355.401, "r_x1": 422.055, "r_y1": 355.401, "r_x2": 422.055, "r_y2": 346.604, "r_x3": 392.111, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "section", "orig": "section", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.798, "r_y0": 355.401, "r_x1": 480.594, "r_y1": 355.401, "r_x2": 480.594, "r_y2": 346.604, "r_x3": 426.798, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "3 we review", "orig": "3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 367.356, "r_x1": 480.587, "r_y1": 367.356, "r_x2": 480.587, "r_y2": 358.559, "r_x3": 134.765, "r_y3": 358.559, "coord_origin": "TOPLEFT"}, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.311, "r_x1": 480.592, "r_y1": 379.311, "r_x2": 480.592, "r_y2": 370.514, "r_x3": 134.765, "r_y3": 370.514, "coord_origin": "TOPLEFT"}, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.266, "r_x1": 480.592, "r_y1": 391.266, "r_x2": 480.592, "r_y2": 382.469, "r_x3": 134.765, "r_y3": 382.469, "coord_origin": "TOPLEFT"}, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 403.221, "r_x1": 480.588, "r_y1": 403.221, "r_x2": 480.588, "r_y2": 394.424, "r_x3": 134.765, "r_y3": 394.424, "coord_origin": "TOPLEFT"}, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 415.177, "r_x1": 480.595, "r_y1": 415.177, "r_x2": 480.595, "r_y2": 406.38, "r_x3": 134.765, "r_y3": 406.38, "coord_origin": "TOPLEFT"}, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 427.132, "r_x1": 142.789, "r_y1": 427.132, "r_x2": 142.789, "r_y2": 418.335, "r_x3": 134.765, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.431, "r_y0": 427.132, "r_x1": 170.173, "r_y1": 427.132, "r_x2": 170.173, "r_y2": 418.335, "r_x3": 147.431, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "using", "orig": "using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.826, "r_y0": 427.132, "r_x1": 288.974, "r_y1": 427.132, "r_x2": 288.974, "r_y2": 418.335, "r_x3": 174.826, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "OTSL. Finally, in section", "orig": "OTSL. Finally, in section", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.627, "r_y0": 427.132, "r_x1": 480.596, "r_y1": 427.132, "r_x2": 480.596, "r_y2": 418.335, "r_x3": 293.627, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "6 we conclude our work and outline next", "orig": "6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.087, "r_x1": 201.272, "r_y1": 439.087, "r_x2": 201.272, "r_y2": 430.29, "r_x3": 134.765, "r_y3": 430.29, "coord_origin": "TOPLEFT"}, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "section_header", "bbox": {"l": 134.765, "t": 462.088, "r": 236.769, "b": 472.656, "coord_origin": "TOPLEFT"}, "confidence": 0.9439423680305481, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 472.656, "r_x1": 141.489, "r_y1": 472.656, "r_x2": 141.489, "r_y2": 462.088, "r_x3": 134.765, "r_y3": 462.088, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 472.656, "r_x1": 236.769, "r_y1": 472.656, "r_x2": 236.769, "r_y2": 462.088, "r_x3": 154.938, "r_y3": 462.088, "coord_origin": "TOPLEFT"}, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 488.686, "r": 484.121, "b": 664.856, "coord_origin": "TOPLEFT"}, "confidence": 0.9870182871818542, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 497.483, "r_x1": 480.591, "r_y1": 497.483, "r_x2": 480.591, "r_y2": 488.686, "r_x3": 134.765, "r_y3": 488.686, "coord_origin": "TOPLEFT"}, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 509.438, "r_x1": 480.592, "r_y1": 509.438, "r_x2": 480.592, "r_y2": 500.641, "r_x3": 134.765, "r_y3": 500.641, "coord_origin": "TOPLEFT"}, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 521.393, "r_x1": 164.401, "r_y1": 521.393, "r_x2": 164.401, "r_y2": 512.596, "r_x3": 134.765, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "variety", "orig": "variety", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.581, "r_y0": 521.393, "r_x1": 177.605, "r_y1": 521.393, "r_x2": 177.605, "r_y2": 512.596, "r_x3": 169.581, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.786, "r_y0": 521.393, "r_x1": 223.77, "r_y1": 521.393, "r_x2": 223.77, "r_y2": 512.596, "r_x3": 182.786, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "computer", "orig": "computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.95, "r_y0": 521.393, "r_x1": 254.183, "r_y1": 521.393, "r_x2": 254.183, "r_y2": 512.596, "r_x3": 228.95, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "vision", "orig": "vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.363, "r_y0": 521.393, "r_x1": 321.047, "r_y1": 521.393, "r_x2": 321.047, "r_y2": 512.596, "r_x3": 259.363, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "methods have", "orig": "methods have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.237, "r_y0": 521.393, "r_x1": 346.435, "r_y1": 521.393, "r_x2": 346.435, "r_y2": 512.596, "r_x3": 326.237, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "been", "orig": "been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 351.616, "r_y0": 521.393, "r_x1": 388.441, "r_y1": 521.393, "r_x2": 388.441, "r_y2": 512.596, "r_x3": 351.616, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "explored", "orig": "explored", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.631, "r_y0": 521.393, "r_x1": 402.485, "r_y1": 521.393, "r_x2": 402.485, "r_y2": 512.596, "r_x3": 393.631, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.666, "r_y0": 521.393, "r_x1": 433.117, "r_y1": 521.393, "r_x2": 433.117, "r_y2": 512.596, "r_x3": 407.666, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "tackle", "orig": "tackle", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 438.307, "r_y0": 521.393, "r_x1": 452.141, "r_y1": 521.393, "r_x2": 452.141, "r_y2": 512.596, "r_x3": 438.307, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 457.321, "r_y0": 521.393, "r_x1": 480.59, "r_y1": 521.393, "r_x2": 480.59, "r_y2": 512.596, "r_x3": 457.321, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "prob-", "orig": "prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.3489999999999, "r_x1": 163.373, "r_y1": 533.3489999999999, "r_x2": 163.373, "r_y2": 524.552, "r_x3": 134.765, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "lem of", "orig": "lem of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.463, "r_y0": 533.3489999999999, "r_x1": 190.043, "r_y1": 533.3489999999999, "r_x2": 190.043, "r_y2": 524.552, "r_x3": 168.463, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.134, "r_y0": 533.3489999999999, "r_x1": 234.531, "r_y1": 533.3489999999999, "r_x2": 234.531, "r_y2": 524.552, "r_x3": 195.134, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.632, "r_y0": 533.3489999999999, "r_x1": 290.567, "r_y1": 533.3489999999999, "r_x2": 290.567, "r_y2": 524.552, "r_x3": 239.632, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "recognition,", "orig": "recognition,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.658, "r_y0": 533.3489999999999, "r_x1": 308.384, "r_y1": 533.3489999999999, "r_x2": 308.384, "r_y2": 524.552, "r_x3": 295.658, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.475, "r_y0": 533.3489999999999, "r_x1": 327.308, "r_y1": 533.3489999999999, "r_x2": 327.308, "r_y2": 524.552, "r_x3": 313.475, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.399, "r_y0": 533.3489999999999, "r_x1": 362.335, "r_y1": 533.3489999999999, "r_x2": 362.335, "r_y2": 524.552, "r_x3": 332.399, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "correct", "orig": "correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.426, "r_y0": 533.3489999999999, "r_x1": 424.15, "r_y1": 533.3489999999999, "r_x2": 424.15, "r_y2": 524.552, "r_x3": 367.426, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "identification", "orig": "identification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.241, "r_y0": 533.3489999999999, "r_x1": 437.264, "r_y1": 533.3489999999999, "r_x2": 437.264, "r_y2": 524.552, "r_x3": 429.241, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.355, "r_y0": 533.3489999999999, "r_x1": 480.59, "r_y1": 533.3489999999999, "r_x2": 480.59, "r_y2": 524.552, "r_x3": 442.355, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "columns,", "orig": "columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 480.59, "r_y1": 545.304, "r_x2": 480.59, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.589, "r_y1": 557.259, "r_x2": 480.589, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 152.252, "r_y1": 569.2139999999999, "r_x2": 152.252, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "ods,", "orig": "ods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.433, "r_y0": 569.2139999999999, "r_x1": 257.459, "r_y1": 569.2139999999999, "r_x2": 257.459, "r_y2": 560.417, "r_x3": 157.433, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "Graph-Neural-Network", "orig": "Graph-Neural-Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.65, "r_y0": 569.2139999999999, "r_x1": 480.591, "r_y1": 569.2139999999999, "r_x2": 480.591, "r_y2": 560.417, "r_x3": 262.65, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "(GNN) methods and Image-to-Markup-Sequence", "orig": "(GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 484.121, "r_y1": 581.169, "r_x2": 484.121, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.596, "r_y1": 593.124, "r_x2": 480.596, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.589, "r_y1": 605.08, "r_x2": 480.589, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.591, "r_y1": 617.035, "r_x2": 480.591, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.586, "r_y1": 628.99, "r_x2": 480.586, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.589, "r_y1": 652.9, "r_x2": 480.589, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.856, "r_x1": 480.591, "r_y1": 664.856, "r_x2": 480.591, "r_y2": 656.059, "r_x3": 134.765, "r_y3": 656.059, "coord_origin": "TOPLEFT"}, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 5, "page_no": 2, "cluster": {"id": 5, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9325801730155945, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 6, "page_no": 2, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8773486614227295, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3"}, {"label": "text", "id": 2, "page_no": 2, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.592, "b": 211.41700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9871802926063538, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 127.731, "r_x1": 480.592, "r_y1": 127.731, "r_x2": 480.592, "r_y2": 118.93399999999997, "r_x3": 149.709, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.587, "r_y1": 139.68600000000004, "r_x2": 480.587, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.592, "r_y1": 151.64200000000005, "r_x2": 480.592, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 169.625, "r_y1": 163.59699999999998, "r_x2": 169.625, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 173.861, "r_y0": 163.59699999999998, "r_x1": 194.555, "r_y1": 163.59699999999998, "r_x2": 194.555, "r_y2": 154.79999999999995, "r_x3": 173.861, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.61, "r_y0": 163.59699999999998, "r_x1": 211.535, "r_y1": 163.59699999999998, "r_x2": 211.535, "r_y2": 154.79999999999995, "r_x3": 199.61, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.769, "r_y0": 163.59699999999998, "r_x1": 480.586, "r_y1": 163.59699999999998, "r_x2": 480.586, "r_y2": 154.79999999999995, "r_x3": 215.769, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "the sequence tokenization in Im2Seq models. In this paper,", "orig": "the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.592, "r_y1": 175.55200000000002, "r_x2": 480.592, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 480.59, "r_y1": 187.50699999999995, "r_x2": 480.59, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 199.462, "r_x1": 480.592, "r_y1": 199.462, "r_x2": 480.592, "r_y2": 190.66499999999996, "r_x3": 134.765, "r_y3": 190.66499999999996, "coord_origin": "TOPLEFT"}, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 211.41700000000003, "r_x1": 348.355, "r_y1": 211.41700000000003, "r_x2": 348.355, "r_y2": 202.62, "r_x3": 134.765, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "While the majority of research in TSR is currently focused on the development and application of novel neural model architectures, the table structure representation language (e.g. HTML in PubTabNet and FinTabNet) is usually adopted as is for the sequence tokenization in Im2Seq models. In this paper, we aim for the opposite and investigate the impact of the table structure representation language with an otherwise unmodified Im2Seq transformer-based architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9], we select this model to perform our experiments."}, {"label": "text", "id": 1, "page_no": 2, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 214.836, "r": 480.596, "b": 331.23, "coord_origin": "TOPLEFT"}, "confidence": 0.9871861338615417, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 223.63300000000004, "r_x1": 480.594, "r_y1": 223.63300000000004, "r_x2": 480.594, "r_y2": 214.836, "r_x3": 149.709, "r_y3": 214.836, "coord_origin": "TOPLEFT"}, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.58799999999997, "r_x1": 480.594, "r_y1": 235.58799999999997, "r_x2": 480.594, "r_y2": 226.79100000000005, "r_x3": 134.765, "r_y3": 226.79100000000005, "coord_origin": "TOPLEFT"}, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.54399999999998, "r_x1": 480.587, "r_y1": 247.54399999999998, "r_x2": 480.587, "r_y2": 238.74699999999996, "r_x3": 134.765, "r_y3": 238.74699999999996, "coord_origin": "TOPLEFT"}, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.499, "r_x1": 480.587, "r_y1": 259.499, "r_x2": 480.587, "r_y2": 250.702, "r_x3": 134.765, "r_y3": 250.702, "coord_origin": "TOPLEFT"}, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 271.45399999999995, "r_x1": 480.588, "r_y1": 271.45399999999995, "r_x2": 480.588, "r_y2": 262.65700000000004, "r_x3": 134.765, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.409, "r_x1": 480.596, "r_y1": 283.409, "r_x2": 480.596, "r_y2": 274.61199999999997, "r_x3": 134.765, "r_y3": 274.61199999999997, "coord_origin": "TOPLEFT"}, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.364, "r_x1": 480.593, "r_y1": 295.364, "r_x2": 480.593, "r_y2": 286.567, "r_x3": 134.765, "r_y3": 286.567, "coord_origin": "TOPLEFT"}, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 307.319, "r_x1": 480.595, "r_y1": 307.319, "r_x2": 480.595, "r_y2": 298.522, "r_x3": 134.765, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 319.275, "r_x1": 480.587, "r_y1": 319.275, "r_x2": 480.587, "r_y2": 310.478, "r_x3": 134.765, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.23, "r_x1": 179.72, "r_y1": 331.23, "r_x2": 179.72, "r_y2": 322.433, "r_x3": 134.765, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The main contribution of this paper is the introduction of a new optimised table structure language (OTSL), specifically designed to describe table-structure in an compact and structured way for Im2Seq models. OTSL has a number of key features, which make it very attractive to use in Im2Seq models. Specifically, compared to other languages such as HTML, OTSL has a minimized vocabulary which yields short sequence length, strong inherent structure (e.g. strict rectangular layout) and a strict syntax with rules that only look backwards. The latter allows for syntax validation during inference and ensures a syntactically correct table-structure. These OTSL features are illustrated in Figure 1, in comparison to HTML."}, {"label": "text", "id": 0, "page_no": 2, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 334.648, "r": 480.596, "b": 439.087, "coord_origin": "TOPLEFT"}, "confidence": 0.988121747970581, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 343.445, "r_x1": 480.588, "r_y1": 343.445, "r_x2": 480.588, "r_y2": 334.648, "r_x3": 149.709, "r_y3": 334.648, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 355.401, "r_x1": 158.613, "r_y1": 355.401, "r_x2": 158.613, "r_y2": 346.604, "r_x3": 134.765, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "latest", "orig": "latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.366, "r_y0": 355.401, "r_x1": 303.894, "r_y1": 355.401, "r_x2": 303.894, "r_y2": 346.604, "r_x3": 163.366, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "developments in table-structure", "orig": "developments in table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.636, "r_y0": 355.401, "r_x1": 373.487, "r_y1": 355.401, "r_x2": 373.487, "r_y2": 346.604, "r_x3": 308.636, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "reconstruction.", "orig": "reconstruction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.239, "r_y0": 355.401, "r_x1": 387.369, "r_y1": 355.401, "r_x2": 387.369, "r_y2": 346.604, "r_x3": 378.239, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.111, "r_y0": 355.401, "r_x1": 422.055, "r_y1": 355.401, "r_x2": 422.055, "r_y2": 346.604, "r_x3": 392.111, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "section", "orig": "section", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.798, "r_y0": 355.401, "r_x1": 480.594, "r_y1": 355.401, "r_x2": 480.594, "r_y2": 346.604, "r_x3": 426.798, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "3 we review", "orig": "3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 367.356, "r_x1": 480.587, "r_y1": 367.356, "r_x2": 480.587, "r_y2": 358.559, "r_x3": 134.765, "r_y3": 358.559, "coord_origin": "TOPLEFT"}, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.311, "r_x1": 480.592, "r_y1": 379.311, "r_x2": 480.592, "r_y2": 370.514, "r_x3": 134.765, "r_y3": 370.514, "coord_origin": "TOPLEFT"}, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.266, "r_x1": 480.592, "r_y1": 391.266, "r_x2": 480.592, "r_y2": 382.469, "r_x3": 134.765, "r_y3": 382.469, "coord_origin": "TOPLEFT"}, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 403.221, "r_x1": 480.588, "r_y1": 403.221, "r_x2": 480.588, "r_y2": 394.424, "r_x3": 134.765, "r_y3": 394.424, "coord_origin": "TOPLEFT"}, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 415.177, "r_x1": 480.595, "r_y1": 415.177, "r_x2": 480.595, "r_y2": 406.38, "r_x3": 134.765, "r_y3": 406.38, "coord_origin": "TOPLEFT"}, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 427.132, "r_x1": 142.789, "r_y1": 427.132, "r_x2": 142.789, "r_y2": 418.335, "r_x3": 134.765, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.431, "r_y0": 427.132, "r_x1": 170.173, "r_y1": 427.132, "r_x2": 170.173, "r_y2": 418.335, "r_x3": 147.431, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "using", "orig": "using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.826, "r_y0": 427.132, "r_x1": 288.974, "r_y1": 427.132, "r_x2": 288.974, "r_y2": 418.335, "r_x3": 174.826, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "OTSL. Finally, in section", "orig": "OTSL. Finally, in section", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.627, "r_y0": 427.132, "r_x1": 480.596, "r_y1": 427.132, "r_x2": 480.596, "r_y2": 418.335, "r_x3": 293.627, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "6 we conclude our work and outline next", "orig": "6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.087, "r_x1": 201.272, "r_y1": 439.087, "r_x2": 201.272, "r_y2": 430.29, "r_x3": 134.765, "r_y3": 430.29, "coord_origin": "TOPLEFT"}, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The paper is structured as follows. In section 2, we give an overview of the latest developments in table-structure reconstruction. In section 3 we review the current HTML table encoding (popularised by PubTabNet and FinTabNet) and discuss its flaws. Subsequently, we introduce OTSL in section 4, which includes the language definition, syntax rules and error-correction procedures. In section 5, we apply OTSL on the TableFormer architecture, compare it to TableFormer models trained on HTML and ultimately demonstrate the advantages of using OTSL. Finally, in section 6 we conclude our work and outline next potential steps."}, {"label": "section_header", "id": 4, "page_no": 2, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 134.765, "t": 462.088, "r": 236.769, "b": 472.656, "coord_origin": "TOPLEFT"}, "confidence": 0.9439423680305481, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 472.656, "r_x1": 141.489, "r_y1": 472.656, "r_x2": 141.489, "r_y2": 462.088, "r_x3": 134.765, "r_y3": 462.088, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 472.656, "r_x1": 236.769, "r_y1": 472.656, "r_x2": 236.769, "r_y2": 462.088, "r_x3": 154.938, "r_y3": 462.088, "coord_origin": "TOPLEFT"}, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2 Related Work"}, {"label": "text", "id": 3, "page_no": 2, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 488.686, "r": 484.121, "b": 664.856, "coord_origin": "TOPLEFT"}, "confidence": 0.9870182871818542, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 497.483, "r_x1": 480.591, "r_y1": 497.483, "r_x2": 480.591, "r_y2": 488.686, "r_x3": 134.765, "r_y3": 488.686, "coord_origin": "TOPLEFT"}, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 509.438, "r_x1": 480.592, "r_y1": 509.438, "r_x2": 480.592, "r_y2": 500.641, "r_x3": 134.765, "r_y3": 500.641, "coord_origin": "TOPLEFT"}, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 521.393, "r_x1": 164.401, "r_y1": 521.393, "r_x2": 164.401, "r_y2": 512.596, "r_x3": 134.765, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "variety", "orig": "variety", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.581, "r_y0": 521.393, "r_x1": 177.605, "r_y1": 521.393, "r_x2": 177.605, "r_y2": 512.596, "r_x3": 169.581, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.786, "r_y0": 521.393, "r_x1": 223.77, "r_y1": 521.393, "r_x2": 223.77, "r_y2": 512.596, "r_x3": 182.786, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "computer", "orig": "computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.95, "r_y0": 521.393, "r_x1": 254.183, "r_y1": 521.393, "r_x2": 254.183, "r_y2": 512.596, "r_x3": 228.95, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "vision", "orig": "vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.363, "r_y0": 521.393, "r_x1": 321.047, "r_y1": 521.393, "r_x2": 321.047, "r_y2": 512.596, "r_x3": 259.363, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "methods have", "orig": "methods have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.237, "r_y0": 521.393, "r_x1": 346.435, "r_y1": 521.393, "r_x2": 346.435, "r_y2": 512.596, "r_x3": 326.237, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "been", "orig": "been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 351.616, "r_y0": 521.393, "r_x1": 388.441, "r_y1": 521.393, "r_x2": 388.441, "r_y2": 512.596, "r_x3": 351.616, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "explored", "orig": "explored", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.631, "r_y0": 521.393, "r_x1": 402.485, "r_y1": 521.393, "r_x2": 402.485, "r_y2": 512.596, "r_x3": 393.631, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.666, "r_y0": 521.393, "r_x1": 433.117, "r_y1": 521.393, "r_x2": 433.117, "r_y2": 512.596, "r_x3": 407.666, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "tackle", "orig": "tackle", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 438.307, "r_y0": 521.393, "r_x1": 452.141, "r_y1": 521.393, "r_x2": 452.141, "r_y2": 512.596, "r_x3": 438.307, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 457.321, "r_y0": 521.393, "r_x1": 480.59, "r_y1": 521.393, "r_x2": 480.59, "r_y2": 512.596, "r_x3": 457.321, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "prob-", "orig": "prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.3489999999999, "r_x1": 163.373, "r_y1": 533.3489999999999, "r_x2": 163.373, "r_y2": 524.552, "r_x3": 134.765, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "lem of", "orig": "lem of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.463, "r_y0": 533.3489999999999, "r_x1": 190.043, "r_y1": 533.3489999999999, "r_x2": 190.043, "r_y2": 524.552, "r_x3": 168.463, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.134, "r_y0": 533.3489999999999, "r_x1": 234.531, "r_y1": 533.3489999999999, "r_x2": 234.531, "r_y2": 524.552, "r_x3": 195.134, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.632, "r_y0": 533.3489999999999, "r_x1": 290.567, "r_y1": 533.3489999999999, "r_x2": 290.567, "r_y2": 524.552, "r_x3": 239.632, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "recognition,", "orig": "recognition,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.658, "r_y0": 533.3489999999999, "r_x1": 308.384, "r_y1": 533.3489999999999, "r_x2": 308.384, "r_y2": 524.552, "r_x3": 295.658, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.475, "r_y0": 533.3489999999999, "r_x1": 327.308, "r_y1": 533.3489999999999, "r_x2": 327.308, "r_y2": 524.552, "r_x3": 313.475, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.399, "r_y0": 533.3489999999999, "r_x1": 362.335, "r_y1": 533.3489999999999, "r_x2": 362.335, "r_y2": 524.552, "r_x3": 332.399, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "correct", "orig": "correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.426, "r_y0": 533.3489999999999, "r_x1": 424.15, "r_y1": 533.3489999999999, "r_x2": 424.15, "r_y2": 524.552, "r_x3": 367.426, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "identification", "orig": "identification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.241, "r_y0": 533.3489999999999, "r_x1": 437.264, "r_y1": 533.3489999999999, "r_x2": 437.264, "r_y2": 524.552, "r_x3": 429.241, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.355, "r_y0": 533.3489999999999, "r_x1": 480.59, "r_y1": 533.3489999999999, "r_x2": 480.59, "r_y2": 524.552, "r_x3": 442.355, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "columns,", "orig": "columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 480.59, "r_y1": 545.304, "r_x2": 480.59, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.589, "r_y1": 557.259, "r_x2": 480.589, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 152.252, "r_y1": 569.2139999999999, "r_x2": 152.252, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "ods,", "orig": "ods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.433, "r_y0": 569.2139999999999, "r_x1": 257.459, "r_y1": 569.2139999999999, "r_x2": 257.459, "r_y2": 560.417, "r_x3": 157.433, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "Graph-Neural-Network", "orig": "Graph-Neural-Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.65, "r_y0": 569.2139999999999, "r_x1": 480.591, "r_y1": 569.2139999999999, "r_x2": 480.591, "r_y2": 560.417, "r_x3": 262.65, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "(GNN) methods and Image-to-Markup-Sequence", "orig": "(GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 484.121, "r_y1": 581.169, "r_x2": 484.121, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.596, "r_y1": 593.124, "r_x2": 480.596, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.589, "r_y1": 605.08, "r_x2": 480.589, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.591, "r_y1": 617.035, "r_x2": 480.591, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.586, "r_y1": 628.99, "r_x2": 480.586, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.589, "r_y1": 652.9, "r_x2": 480.589, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.856, "r_x1": 480.591, "r_y1": 664.856, "r_x2": 480.591, "r_y2": 656.059, "r_x3": 134.765, "r_y3": 656.059, "coord_origin": "TOPLEFT"}, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Approaches to formalize the logical structure and layout of tables in electronic documents date back more than two decades [16]. In the recent past, a wide variety of computer vision methods have been explored to tackle the problem of table structure recognition, i.e. the correct identification of columns, rows and spanning cells in a given table. Broadly speaking, the current deeplearning based approaches fall into three categories: object detection (OD) methods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence (Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on tablestructure annotation using (overlapping) bounding boxes for training, and produce bounding-box predictions to define table cells, rows, and columns on a table image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name suggests, represent tables as graph structures. The graph nodes represent the content of each table cell, an embedding vector from the table image, or geometric coordinates of the table cell. The edges of the graph define the relationship between the nodes, e.g. if they belong to the same column, row, or table cell."}], "body": [{"label": "text", "id": 2, "page_no": 2, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.592, "b": 211.41700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9871802926063538, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 127.731, "r_x1": 480.592, "r_y1": 127.731, "r_x2": 480.592, "r_y2": 118.93399999999997, "r_x3": 149.709, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.587, "r_y1": 139.68600000000004, "r_x2": 480.587, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.592, "r_y1": 151.64200000000005, "r_x2": 480.592, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 169.625, "r_y1": 163.59699999999998, "r_x2": 169.625, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 173.861, "r_y0": 163.59699999999998, "r_x1": 194.555, "r_y1": 163.59699999999998, "r_x2": 194.555, "r_y2": 154.79999999999995, "r_x3": 173.861, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.61, "r_y0": 163.59699999999998, "r_x1": 211.535, "r_y1": 163.59699999999998, "r_x2": 211.535, "r_y2": 154.79999999999995, "r_x3": 199.61, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.769, "r_y0": 163.59699999999998, "r_x1": 480.586, "r_y1": 163.59699999999998, "r_x2": 480.586, "r_y2": 154.79999999999995, "r_x3": 215.769, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "the sequence tokenization in Im2Seq models. In this paper,", "orig": "the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.592, "r_y1": 175.55200000000002, "r_x2": 480.592, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 480.59, "r_y1": 187.50699999999995, "r_x2": 480.59, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 199.462, "r_x1": 480.592, "r_y1": 199.462, "r_x2": 480.592, "r_y2": 190.66499999999996, "r_x3": 134.765, "r_y3": 190.66499999999996, "coord_origin": "TOPLEFT"}, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 211.41700000000003, "r_x1": 348.355, "r_y1": 211.41700000000003, "r_x2": 348.355, "r_y2": 202.62, "r_x3": 134.765, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "While the majority of research in TSR is currently focused on the development and application of novel neural model architectures, the table structure representation language (e.g. HTML in PubTabNet and FinTabNet) is usually adopted as is for the sequence tokenization in Im2Seq models. In this paper, we aim for the opposite and investigate the impact of the table structure representation language with an otherwise unmodified Im2Seq transformer-based architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9], we select this model to perform our experiments."}, {"label": "text", "id": 1, "page_no": 2, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 214.836, "r": 480.596, "b": 331.23, "coord_origin": "TOPLEFT"}, "confidence": 0.9871861338615417, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 223.63300000000004, "r_x1": 480.594, "r_y1": 223.63300000000004, "r_x2": 480.594, "r_y2": 214.836, "r_x3": 149.709, "r_y3": 214.836, "coord_origin": "TOPLEFT"}, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.58799999999997, "r_x1": 480.594, "r_y1": 235.58799999999997, "r_x2": 480.594, "r_y2": 226.79100000000005, "r_x3": 134.765, "r_y3": 226.79100000000005, "coord_origin": "TOPLEFT"}, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.54399999999998, "r_x1": 480.587, "r_y1": 247.54399999999998, "r_x2": 480.587, "r_y2": 238.74699999999996, "r_x3": 134.765, "r_y3": 238.74699999999996, "coord_origin": "TOPLEFT"}, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.499, "r_x1": 480.587, "r_y1": 259.499, "r_x2": 480.587, "r_y2": 250.702, "r_x3": 134.765, "r_y3": 250.702, "coord_origin": "TOPLEFT"}, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 271.45399999999995, "r_x1": 480.588, "r_y1": 271.45399999999995, "r_x2": 480.588, "r_y2": 262.65700000000004, "r_x3": 134.765, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.409, "r_x1": 480.596, "r_y1": 283.409, "r_x2": 480.596, "r_y2": 274.61199999999997, "r_x3": 134.765, "r_y3": 274.61199999999997, "coord_origin": "TOPLEFT"}, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.364, "r_x1": 480.593, "r_y1": 295.364, "r_x2": 480.593, "r_y2": 286.567, "r_x3": 134.765, "r_y3": 286.567, "coord_origin": "TOPLEFT"}, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 307.319, "r_x1": 480.595, "r_y1": 307.319, "r_x2": 480.595, "r_y2": 298.522, "r_x3": 134.765, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 319.275, "r_x1": 480.587, "r_y1": 319.275, "r_x2": 480.587, "r_y2": 310.478, "r_x3": 134.765, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.23, "r_x1": 179.72, "r_y1": 331.23, "r_x2": 179.72, "r_y2": 322.433, "r_x3": 134.765, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The main contribution of this paper is the introduction of a new optimised table structure language (OTSL), specifically designed to describe table-structure in an compact and structured way for Im2Seq models. OTSL has a number of key features, which make it very attractive to use in Im2Seq models. Specifically, compared to other languages such as HTML, OTSL has a minimized vocabulary which yields short sequence length, strong inherent structure (e.g. strict rectangular layout) and a strict syntax with rules that only look backwards. The latter allows for syntax validation during inference and ensures a syntactically correct table-structure. These OTSL features are illustrated in Figure 1, in comparison to HTML."}, {"label": "text", "id": 0, "page_no": 2, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 334.648, "r": 480.596, "b": 439.087, "coord_origin": "TOPLEFT"}, "confidence": 0.988121747970581, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 343.445, "r_x1": 480.588, "r_y1": 343.445, "r_x2": 480.588, "r_y2": 334.648, "r_x3": 149.709, "r_y3": 334.648, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 355.401, "r_x1": 158.613, "r_y1": 355.401, "r_x2": 158.613, "r_y2": 346.604, "r_x3": 134.765, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "latest", "orig": "latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.366, "r_y0": 355.401, "r_x1": 303.894, "r_y1": 355.401, "r_x2": 303.894, "r_y2": 346.604, "r_x3": 163.366, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "developments in table-structure", "orig": "developments in table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.636, "r_y0": 355.401, "r_x1": 373.487, "r_y1": 355.401, "r_x2": 373.487, "r_y2": 346.604, "r_x3": 308.636, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "reconstruction.", "orig": "reconstruction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.239, "r_y0": 355.401, "r_x1": 387.369, "r_y1": 355.401, "r_x2": 387.369, "r_y2": 346.604, "r_x3": 378.239, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.111, "r_y0": 355.401, "r_x1": 422.055, "r_y1": 355.401, "r_x2": 422.055, "r_y2": 346.604, "r_x3": 392.111, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "section", "orig": "section", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.798, "r_y0": 355.401, "r_x1": 480.594, "r_y1": 355.401, "r_x2": 480.594, "r_y2": 346.604, "r_x3": 426.798, "r_y3": 346.604, "coord_origin": "TOPLEFT"}, "text": "3 we review", "orig": "3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 367.356, "r_x1": 480.587, "r_y1": 367.356, "r_x2": 480.587, "r_y2": 358.559, "r_x3": 134.765, "r_y3": 358.559, "coord_origin": "TOPLEFT"}, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.311, "r_x1": 480.592, "r_y1": 379.311, "r_x2": 480.592, "r_y2": 370.514, "r_x3": 134.765, "r_y3": 370.514, "coord_origin": "TOPLEFT"}, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.266, "r_x1": 480.592, "r_y1": 391.266, "r_x2": 480.592, "r_y2": 382.469, "r_x3": 134.765, "r_y3": 382.469, "coord_origin": "TOPLEFT"}, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 403.221, "r_x1": 480.588, "r_y1": 403.221, "r_x2": 480.588, "r_y2": 394.424, "r_x3": 134.765, "r_y3": 394.424, "coord_origin": "TOPLEFT"}, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 415.177, "r_x1": 480.595, "r_y1": 415.177, "r_x2": 480.595, "r_y2": 406.38, "r_x3": 134.765, "r_y3": 406.38, "coord_origin": "TOPLEFT"}, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 427.132, "r_x1": 142.789, "r_y1": 427.132, "r_x2": 142.789, "r_y2": 418.335, "r_x3": 134.765, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.431, "r_y0": 427.132, "r_x1": 170.173, "r_y1": 427.132, "r_x2": 170.173, "r_y2": 418.335, "r_x3": 147.431, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "using", "orig": "using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.826, "r_y0": 427.132, "r_x1": 288.974, "r_y1": 427.132, "r_x2": 288.974, "r_y2": 418.335, "r_x3": 174.826, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "OTSL. Finally, in section", "orig": "OTSL. Finally, in section", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.627, "r_y0": 427.132, "r_x1": 480.596, "r_y1": 427.132, "r_x2": 480.596, "r_y2": 418.335, "r_x3": 293.627, "r_y3": 418.335, "coord_origin": "TOPLEFT"}, "text": "6 we conclude our work and outline next", "orig": "6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.087, "r_x1": 201.272, "r_y1": 439.087, "r_x2": 201.272, "r_y2": 430.29, "r_x3": 134.765, "r_y3": 430.29, "coord_origin": "TOPLEFT"}, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The paper is structured as follows. In section 2, we give an overview of the latest developments in table-structure reconstruction. In section 3 we review the current HTML table encoding (popularised by PubTabNet and FinTabNet) and discuss its flaws. Subsequently, we introduce OTSL in section 4, which includes the language definition, syntax rules and error-correction procedures. In section 5, we apply OTSL on the TableFormer architecture, compare it to TableFormer models trained on HTML and ultimately demonstrate the advantages of using OTSL. Finally, in section 6 we conclude our work and outline next potential steps."}, {"label": "section_header", "id": 4, "page_no": 2, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 134.765, "t": 462.088, "r": 236.769, "b": 472.656, "coord_origin": "TOPLEFT"}, "confidence": 0.9439423680305481, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 472.656, "r_x1": 141.489, "r_y1": 472.656, "r_x2": 141.489, "r_y2": 462.088, "r_x3": 134.765, "r_y3": 462.088, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 472.656, "r_x1": 236.769, "r_y1": 472.656, "r_x2": 236.769, "r_y2": 462.088, "r_x3": 154.938, "r_y3": 462.088, "coord_origin": "TOPLEFT"}, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2 Related Work"}, {"label": "text", "id": 3, "page_no": 2, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 488.686, "r": 484.121, "b": 664.856, "coord_origin": "TOPLEFT"}, "confidence": 0.9870182871818542, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 497.483, "r_x1": 480.591, "r_y1": 497.483, "r_x2": 480.591, "r_y2": 488.686, "r_x3": 134.765, "r_y3": 488.686, "coord_origin": "TOPLEFT"}, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 509.438, "r_x1": 480.592, "r_y1": 509.438, "r_x2": 480.592, "r_y2": 500.641, "r_x3": 134.765, "r_y3": 500.641, "coord_origin": "TOPLEFT"}, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 521.393, "r_x1": 164.401, "r_y1": 521.393, "r_x2": 164.401, "r_y2": 512.596, "r_x3": 134.765, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "variety", "orig": "variety", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.581, "r_y0": 521.393, "r_x1": 177.605, "r_y1": 521.393, "r_x2": 177.605, "r_y2": 512.596, "r_x3": 169.581, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.786, "r_y0": 521.393, "r_x1": 223.77, "r_y1": 521.393, "r_x2": 223.77, "r_y2": 512.596, "r_x3": 182.786, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "computer", "orig": "computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.95, "r_y0": 521.393, "r_x1": 254.183, "r_y1": 521.393, "r_x2": 254.183, "r_y2": 512.596, "r_x3": 228.95, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "vision", "orig": "vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.363, "r_y0": 521.393, "r_x1": 321.047, "r_y1": 521.393, "r_x2": 321.047, "r_y2": 512.596, "r_x3": 259.363, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "methods have", "orig": "methods have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.237, "r_y0": 521.393, "r_x1": 346.435, "r_y1": 521.393, "r_x2": 346.435, "r_y2": 512.596, "r_x3": 326.237, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "been", "orig": "been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 351.616, "r_y0": 521.393, "r_x1": 388.441, "r_y1": 521.393, "r_x2": 388.441, "r_y2": 512.596, "r_x3": 351.616, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "explored", "orig": "explored", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.631, "r_y0": 521.393, "r_x1": 402.485, "r_y1": 521.393, "r_x2": 402.485, "r_y2": 512.596, "r_x3": 393.631, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.666, "r_y0": 521.393, "r_x1": 433.117, "r_y1": 521.393, "r_x2": 433.117, "r_y2": 512.596, "r_x3": 407.666, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "tackle", "orig": "tackle", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 438.307, "r_y0": 521.393, "r_x1": 452.141, "r_y1": 521.393, "r_x2": 452.141, "r_y2": 512.596, "r_x3": 438.307, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 457.321, "r_y0": 521.393, "r_x1": 480.59, "r_y1": 521.393, "r_x2": 480.59, "r_y2": 512.596, "r_x3": 457.321, "r_y3": 512.596, "coord_origin": "TOPLEFT"}, "text": "prob-", "orig": "prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.3489999999999, "r_x1": 163.373, "r_y1": 533.3489999999999, "r_x2": 163.373, "r_y2": 524.552, "r_x3": 134.765, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "lem of", "orig": "lem of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.463, "r_y0": 533.3489999999999, "r_x1": 190.043, "r_y1": 533.3489999999999, "r_x2": 190.043, "r_y2": 524.552, "r_x3": 168.463, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.134, "r_y0": 533.3489999999999, "r_x1": 234.531, "r_y1": 533.3489999999999, "r_x2": 234.531, "r_y2": 524.552, "r_x3": 195.134, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.632, "r_y0": 533.3489999999999, "r_x1": 290.567, "r_y1": 533.3489999999999, "r_x2": 290.567, "r_y2": 524.552, "r_x3": 239.632, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "recognition,", "orig": "recognition,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.658, "r_y0": 533.3489999999999, "r_x1": 308.384, "r_y1": 533.3489999999999, "r_x2": 308.384, "r_y2": 524.552, "r_x3": 295.658, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.475, "r_y0": 533.3489999999999, "r_x1": 327.308, "r_y1": 533.3489999999999, "r_x2": 327.308, "r_y2": 524.552, "r_x3": 313.475, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.399, "r_y0": 533.3489999999999, "r_x1": 362.335, "r_y1": 533.3489999999999, "r_x2": 362.335, "r_y2": 524.552, "r_x3": 332.399, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "correct", "orig": "correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.426, "r_y0": 533.3489999999999, "r_x1": 424.15, "r_y1": 533.3489999999999, "r_x2": 424.15, "r_y2": 524.552, "r_x3": 367.426, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "identification", "orig": "identification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.241, "r_y0": 533.3489999999999, "r_x1": 437.264, "r_y1": 533.3489999999999, "r_x2": 437.264, "r_y2": 524.552, "r_x3": 429.241, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.355, "r_y0": 533.3489999999999, "r_x1": 480.59, "r_y1": 533.3489999999999, "r_x2": 480.59, "r_y2": 524.552, "r_x3": 442.355, "r_y3": 524.552, "coord_origin": "TOPLEFT"}, "text": "columns,", "orig": "columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 480.59, "r_y1": 545.304, "r_x2": 480.59, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.589, "r_y1": 557.259, "r_x2": 480.589, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 152.252, "r_y1": 569.2139999999999, "r_x2": 152.252, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "ods,", "orig": "ods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.433, "r_y0": 569.2139999999999, "r_x1": 257.459, "r_y1": 569.2139999999999, "r_x2": 257.459, "r_y2": 560.417, "r_x3": 157.433, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "Graph-Neural-Network", "orig": "Graph-Neural-Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.65, "r_y0": 569.2139999999999, "r_x1": 480.591, "r_y1": 569.2139999999999, "r_x2": 480.591, "r_y2": 560.417, "r_x3": 262.65, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "(GNN) methods and Image-to-Markup-Sequence", "orig": "(GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 484.121, "r_y1": 581.169, "r_x2": 484.121, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.596, "r_y1": 593.124, "r_x2": 480.596, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.589, "r_y1": 605.08, "r_x2": 480.589, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.591, "r_y1": 617.035, "r_x2": 480.591, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.586, "r_y1": 628.99, "r_x2": 480.586, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.589, "r_y1": 652.9, "r_x2": 480.589, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.856, "r_x1": 480.591, "r_y1": 664.856, "r_x2": 480.591, "r_y2": 656.059, "r_x3": 134.765, "r_y3": 656.059, "coord_origin": "TOPLEFT"}, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Approaches to formalize the logical structure and layout of tables in electronic documents date back more than two decades [16]. In the recent past, a wide variety of computer vision methods have been explored to tackle the problem of table structure recognition, i.e. the correct identification of columns, rows and spanning cells in a given table. Broadly speaking, the current deeplearning based approaches fall into three categories: object detection (OD) methods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence (Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on tablestructure annotation using (overlapping) bounding boxes for training, and produce bounding-box predictions to define table cells, rows, and columns on a table image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name suggests, represent tables as graph structures. The graph nodes represent the content of each table cell, an embedding vector from the table image, or geometric coordinates of the table cell. The edges of the graph define the relationship between the nodes, e.g. if they belong to the same column, row, or table cell."}], "headers": [{"label": "page_header", "id": 5, "page_no": 2, "cluster": {"id": 5, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9325801730155945, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 6, "page_no": 2, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8773486614227295, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3"}]}}, {"page_no": 3, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.594, "r_y1": 127.731, "r_x2": 480.594, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.588, "r_y1": 139.68600000000004, "r_x2": 480.588, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.587, "r_y1": 151.64200000000005, "r_x2": 480.587, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 174.162, "r_y1": 163.59699999999998, "r_x2": 174.162, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.755, "r_y0": 163.59699999999998, "r_x1": 240.56, "r_y1": 163.59699999999998, "r_x2": 240.56, "r_y2": 154.79999999999995, "r_x3": 178.755, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "representation", "orig": "representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.143, "r_y0": 163.59699999999998, "r_x1": 286.09, "r_y1": 163.59699999999998, "r_x2": 286.09, "r_y2": 154.79999999999995, "r_x3": 245.143, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "language,", "orig": "language,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 290.683, "r_y0": 163.59699999999998, "r_x1": 327.144, "r_y1": 163.59699999999998, "r_x2": 327.144, "r_y2": 154.79999999999995, "r_x3": 290.683, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "which is", "orig": "which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.727, "r_y0": 163.59699999999998, "r_x1": 353.584, "r_y1": 163.59699999999998, "r_x2": 353.584, "r_y2": 154.79999999999995, "r_x3": 331.727, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "often", "orig": "often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.176, "r_y0": 163.59699999999998, "r_x1": 480.588, "r_y1": 163.59699999999998, "r_x2": 480.588, "r_y2": 154.79999999999995, "r_x3": 358.176, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "implemented with standard", "orig": "implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.593, "r_y1": 175.55200000000002, "r_x2": 480.593, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 480.596, "r_y1": 187.50699999999995, "r_x2": 480.596, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 199.462, "r_x1": 480.593, "r_y1": 199.462, "r_x2": 480.593, "r_y2": 190.66499999999996, "r_x3": 134.765, "r_y3": 190.66499999999996, "coord_origin": "TOPLEFT"}, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 211.41700000000003, "r_x1": 143.065, "r_y1": 211.41700000000003, "r_x2": 143.065, "r_y2": 202.62, "r_x3": 134.765, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.329, "r_y0": 211.41700000000003, "r_x1": 480.594, "r_y1": 211.41700000000003, "r_x2": 480.594, "r_y2": 202.62, "r_x3": 147.329, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "order to obtain the table-structure, which is necessary with OD and GNN", "orig": "order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 223.37300000000005, "r_x1": 480.588, "r_y1": 223.37300000000005, "r_x2": 480.588, "r_y2": 214.57600000000002, "r_x3": 134.765, "r_y3": 214.57600000000002, "coord_origin": "TOPLEFT"}, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.32799999999997, "r_x1": 480.59, "r_y1": 235.32799999999997, "r_x2": 480.59, "r_y2": 226.53099999999995, "r_x3": 134.765, "r_y3": 226.53099999999995, "coord_origin": "TOPLEFT"}, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.28300000000002, "r_x1": 480.596, "r_y1": 247.28300000000002, "r_x2": 480.596, "r_y2": 238.486, "r_x3": 134.765, "r_y3": 238.486, "coord_origin": "TOPLEFT"}, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.23800000000006, "r_x1": 480.595, "r_y1": 259.23800000000006, "r_x2": 480.595, "r_y2": 250.44100000000003, "r_x3": 134.765, "r_y3": 250.44100000000003, "coord_origin": "TOPLEFT"}, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 271.45399999999995, "r_x1": 199.213, "r_y1": 271.45399999999995, "r_x2": 199.213, "r_y2": 262.65700000000004, "r_x3": 149.709, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "Within the", "orig": "Within the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 204.175, "r_y0": 271.45399999999995, "r_x1": 349.163, "r_y1": 271.45399999999995, "r_x2": 349.163, "r_y2": 262.65700000000004, "r_x3": 204.175, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "Im2Seq method, we find several", "orig": "Im2Seq method, we find several", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.125, "r_y0": 271.45399999999995, "r_x1": 387.632, "r_y1": 271.45399999999995, "r_x2": 387.632, "r_y2": 262.65700000000004, "r_x3": 354.125, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "popular", "orig": "popular", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.593, "r_y0": 271.45399999999995, "r_x1": 425.573, "r_y1": 271.45399999999995, "r_x2": 425.573, "r_y2": 262.65700000000004, "r_x3": 392.593, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "models,", "orig": "models,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.535, "r_y0": 271.45399999999995, "r_x1": 480.593, "r_y1": 271.45399999999995, "r_x2": 480.593, "r_y2": 262.65700000000004, "r_x3": 430.535, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "namely the", "orig": "namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.409, "r_x1": 480.592, "r_y1": 283.409, "r_x2": 480.592, "r_y2": 274.61199999999997, "r_x3": 134.765, "r_y3": 274.61199999999997, "coord_origin": "TOPLEFT"}, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.364, "r_x1": 480.593, "r_y1": 295.364, "r_x2": 480.593, "r_y2": 286.567, "r_x3": 134.765, "r_y3": 286.567, "coord_origin": "TOPLEFT"}, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 307.319, "r_x1": 342.021, "r_y1": 307.319, "r_x2": 342.021, "r_y2": 298.522, "r_x3": 134.765, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.064, "r_y0": 307.319, "r_x1": 393.047, "r_y1": 307.319, "r_x2": 393.047, "r_y2": 298.522, "r_x3": 345.064, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.167, "r_y0": 307.319, "r_x1": 480.591, "r_y1": 307.319, "r_x2": 480.591, "r_y2": 298.522, "r_x3": 397.167, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 319.275, "r_x1": 333.299, "r_y1": 319.275, "r_x2": 333.299, "r_y2": 310.478, "r_x3": 134.765, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.299, "r_y0": 319.275, "r_x1": 356.971, "r_y1": 319.275, "r_x2": 356.971, "r_y2": 310.478, "r_x3": 333.299, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.085, "r_y0": 319.275, "r_x1": 363.725, "r_y1": 319.275, "r_x2": 363.725, "r_y2": 310.478, "r_x3": 357.085, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "),", "orig": "),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.64, "r_y0": 319.275, "r_x1": 480.594, "r_y1": 319.275, "r_x2": 480.594, "r_y2": 310.478, "r_x3": 367.64, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "the attention is passed to", "orig": "the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.23, "r_x1": 148.598, "r_y1": 331.23, "r_x2": 148.598, "r_y2": 322.433, "r_x3": 134.765, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.277, "r_y0": 331.23, "r_x1": 166.531, "r_y1": 331.23, "r_x2": 166.531, "r_y2": 322.433, "r_x3": 152.277, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.427, "r_y0": 331.23, "r_x1": 202.111, "r_y1": 331.23, "r_x2": 202.111, "r_y2": 322.433, "r_x3": 170.427, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "decoder", "orig": "decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.864, "r_y0": 331.23, "r_x1": 480.587, "r_y1": 331.23, "r_x2": 480.587, "r_y2": 322.433, "r_x3": 206.864, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 343.185, "r_x1": 480.595, "r_y1": 343.185, "r_x2": 480.595, "r_y2": 334.388, "r_x3": 134.765, "r_y3": 334.388, "coord_origin": "TOPLEFT"}, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 355.14, "r_x1": 480.587, "r_y1": 355.14, "r_x2": 480.587, "r_y2": 346.343, "r_x3": 134.765, "r_y3": 346.343, "coord_origin": "TOPLEFT"}, "text": "TableFormer address this reliance on OCRand uses two transformer decoders for", "orig": "TableFormer address this reliance on OCRand uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 367.095, "r_x1": 480.589, "r_y1": 367.095, "r_x2": 480.589, "r_y2": 358.298, "r_x3": 134.765, "r_y3": 358.298, "coord_origin": "TOPLEFT"}, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.05, "r_x1": 480.589, "r_y1": 379.05, "r_x2": 480.589, "r_y2": 370.253, "r_x3": 134.765, "r_y3": 370.253, "coord_origin": "TOPLEFT"}, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.006, "r_x1": 480.594, "r_y1": 391.006, "r_x2": 480.594, "r_y2": 382.209, "r_x3": 134.765, "r_y3": 382.209, "coord_origin": "TOPLEFT"}, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 402.961, "r_x1": 480.587, "r_y1": 402.961, "r_x2": 480.587, "r_y2": 394.164, "r_x3": 134.765, "r_y3": 394.164, "coord_origin": "TOPLEFT"}, "text": "[2] proposes a compact double-matrix representation of table rows and columns", "orig": "[2] proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 414.916, "r_x1": 480.596, "r_y1": 414.916, "r_x2": 480.596, "r_y2": 406.119, "r_x3": 134.765, "r_y3": 406.119, "coord_origin": "TOPLEFT"}, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 426.871, "r_x1": 480.592, "r_y1": 426.871, "r_x2": 480.592, "r_y2": 418.074, "r_x3": 134.765, "r_y3": 418.074, "coord_origin": "TOPLEFT"}, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 438.826, "r_x1": 480.588, "r_y1": 438.826, "r_x2": 480.588, "r_y2": 430.029, "r_x3": 134.765, "r_y3": 430.029, "coord_origin": "TOPLEFT"}, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 450.781, "r_x1": 480.589, "r_y1": 450.781, "r_x2": 480.589, "r_y2": 441.984, "r_x3": 134.765, "r_y3": 441.984, "coord_origin": "TOPLEFT"}, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 462.737, "r_x1": 384.575, "r_y1": 462.737, "r_x2": 384.575, "r_y2": 453.94, "r_x3": 134.765, "r_y3": 453.94, "coord_origin": "TOPLEFT"}, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.559, "r_y0": 462.737, "r_x1": 480.588, "r_y1": 462.737, "r_x2": 480.588, "r_y2": 453.94, "r_x3": 391.559, "r_y3": 453.94, "coord_origin": "TOPLEFT"}, "text": "[5] introduces Gated", "orig": "[5] introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 474.692, "r_x1": 480.591, "r_y1": 474.692, "r_x2": 480.591, "r_y2": 465.895, "r_x3": 134.765, "r_y3": 465.895, "coord_origin": "TOPLEFT"}, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 486.647, "r_x1": 203.686, "r_y1": 486.647, "r_x2": 203.686, "r_y2": 477.85, "r_x3": 134.765, "r_y3": 477.85, "coord_origin": "TOPLEFT"}, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 498.863, "r_x1": 480.594, "r_y1": 498.863, "r_x2": 480.594, "r_y2": 490.066, "r_x3": 149.709, "r_y3": 490.066, "coord_origin": "TOPLEFT"}, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 510.818, "r_x1": 480.589, "r_y1": 510.818, "r_x2": 480.589, "r_y2": 502.021, "r_x3": 134.765, "r_y3": 502.021, "coord_origin": "TOPLEFT"}, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 522.773, "r_x1": 480.587, "r_y1": 522.773, "r_x2": 480.587, "r_y2": 513.976, "r_x3": 134.765, "r_y3": 513.976, "coord_origin": "TOPLEFT"}, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 534.7280000000001, "r_x1": 176.662, "r_y1": 534.7280000000001, "r_x2": 176.662, "r_y2": 525.931, "r_x3": 134.765, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "to deliver", "orig": "to deliver", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.896, "r_y0": 534.7280000000001, "r_x1": 246.551, "r_y1": 534.7280000000001, "r_x2": 246.551, "r_y2": 525.931, "r_x3": 180.896, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art", "orig": "state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.785, "r_y0": 534.7280000000001, "r_x1": 480.59, "r_y1": 534.7280000000001, "r_x2": 480.59, "r_y2": 525.931, "r_x3": 250.785, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "prediction accuracy [9]. This motivated the authors", "orig": "prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 546.683, "r_x1": 143.619, "r_y1": 546.683, "r_x2": 143.619, "r_y2": 537.886, "r_x3": 134.765, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.56, "r_y0": 546.683, "r_x1": 194.815, "r_y1": 546.683, "r_x2": 194.815, "r_y2": 537.886, "r_x3": 148.56, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "investigate", "orig": "investigate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.756, "r_y0": 546.683, "r_x1": 205.566, "r_y1": 546.683, "r_x2": 205.566, "r_y2": 537.886, "r_x3": 199.756, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "if", "orig": "if", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.508, "r_y0": 546.683, "r_x1": 224.341, "r_y1": 546.683, "r_x2": 224.341, "r_y2": 537.886, "r_x3": 210.508, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.272, "r_y0": 546.683, "r_x1": 283.004, "r_y1": 546.683, "r_x2": 283.004, "r_y2": 537.886, "r_x3": 229.272, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "performance", "orig": "performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.945, "r_y0": 546.683, "r_x1": 312.018, "r_y1": 546.683, "r_x2": 312.018, "r_y2": 537.886, "r_x3": 287.945, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "(both", "orig": "(both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.949, "r_y0": 546.683, "r_x1": 325.249, "r_y1": 546.683, "r_x2": 325.249, "r_y2": 537.886, "r_x3": 316.949, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.19, "r_y0": 546.683, "r_x1": 368.122, "r_y1": 546.683, "r_x2": 368.122, "r_y2": 537.886, "r_x3": 330.19, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "accuracy", "orig": "accuracy", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.063, "r_y0": 546.683, "r_x1": 432.535, "r_y1": 546.683, "r_x2": 432.535, "r_y2": 537.886, "r_x3": 373.063, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "and inference", "orig": "and inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.477, "r_y0": 546.683, "r_x1": 460.716, "r_y1": 546.683, "r_x2": 460.716, "r_y2": 537.886, "r_x3": 437.477, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "time)", "orig": "time)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.648, "r_y0": 546.683, "r_x1": 480.588, "r_y1": 546.683, "r_x2": 480.588, "r_y2": 537.886, "r_x3": 465.648, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "can", "orig": "can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 558.639, "r_x1": 480.59, "r_y1": 558.639, "r_x2": 480.59, "r_y2": 549.842, "r_x3": 134.765, "r_y3": 549.842, "coord_origin": "TOPLEFT"}, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 570.594, "r_x1": 183.086, "r_y1": 570.594, "r_x2": 183.086, "r_y2": 561.797, "r_x3": 134.765, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "We believe", "orig": "We believe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.977, "r_y0": 570.594, "r_x1": 204.079, "r_y1": 570.594, "r_x2": 204.079, "r_y2": 561.797, "r_x3": 187.977, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.96, "r_y0": 570.594, "r_x1": 215.655, "r_y1": 570.594, "r_x2": 215.655, "r_y2": 561.797, "r_x3": 208.96, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.547, "r_y0": 570.594, "r_x1": 271.217, "r_y1": 570.594, "r_x2": 271.217, "r_y2": 561.797, "r_x3": 220.547, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "a necessary", "orig": "a necessary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 276.108, "r_y0": 570.594, "r_x1": 293.87, "r_y1": 570.594, "r_x2": 293.87, "r_y2": 561.797, "r_x3": 276.108, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "step", "orig": "step", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.751, "r_y0": 570.594, "r_x1": 325.342, "r_y1": 570.594, "r_x2": 325.342, "r_y2": 561.797, "r_x3": 298.751, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "before", "orig": "before", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.223, "r_y0": 570.594, "r_x1": 360.436, "r_y1": 570.594, "r_x2": 360.436, "r_y2": 561.797, "r_x3": 330.223, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "further", "orig": "further", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.327, "r_y0": 570.594, "r_x1": 409.067, "r_y1": 570.594, "r_x2": 409.067, "r_y2": 561.797, "r_x3": 365.327, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "improving", "orig": "improving", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.949, "r_y0": 570.594, "r_x1": 441.09, "r_y1": 570.594, "r_x2": 441.09, "r_y2": 561.797, "r_x3": 413.949, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "neural", "orig": "neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.982, "r_y0": 570.594, "r_x1": 480.589, "r_y1": 570.594, "r_x2": 480.589, "r_y2": 561.797, "r_x3": 445.982, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 582.549, "r_x1": 249.278, "r_y1": 582.549, "r_x2": 249.278, "r_y2": 573.752, "r_x3": 134.765, "r_y3": 573.752, "coord_origin": "TOPLEFT"}, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 616.1179999999999, "r_x1": 141.489, "r_y1": 616.1179999999999, "r_x2": 141.489, "r_y2": 605.55, "r_x3": 134.765, "r_y3": 605.55, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 616.1179999999999, "r_x1": 269.624, "r_y1": 616.1179999999999, "r_x2": 269.624, "r_y2": 605.55, "r_x3": 154.938, "r_y3": 605.55, "coord_origin": "TOPLEFT"}, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.591, "r_y1": 640.9449999999999, "r_x2": 480.591, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.587, "r_y1": 652.9, "r_x2": 480.587, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.856, "r_x1": 480.594, "r_y1": 664.856, "r_x2": 480.594, "r_y2": 656.059, "r_x3": 134.765, "r_y3": 656.059, "coord_origin": "TOPLEFT"}, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 6, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.7890051603317261, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9045588374137878, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.596, "b": 259.23800000000006, "coord_origin": "TOPLEFT"}, "confidence": 0.9467443823814392, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.594, "r_y1": 127.731, "r_x2": 480.594, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.588, "r_y1": 139.68600000000004, "r_x2": 480.588, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.587, "r_y1": 151.64200000000005, "r_x2": 480.587, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 174.162, "r_y1": 163.59699999999998, "r_x2": 174.162, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.755, "r_y0": 163.59699999999998, "r_x1": 240.56, "r_y1": 163.59699999999998, "r_x2": 240.56, "r_y2": 154.79999999999995, "r_x3": 178.755, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "representation", "orig": "representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.143, "r_y0": 163.59699999999998, "r_x1": 286.09, "r_y1": 163.59699999999998, "r_x2": 286.09, "r_y2": 154.79999999999995, "r_x3": 245.143, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "language,", "orig": "language,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 290.683, "r_y0": 163.59699999999998, "r_x1": 327.144, "r_y1": 163.59699999999998, "r_x2": 327.144, "r_y2": 154.79999999999995, "r_x3": 290.683, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "which is", "orig": "which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.727, "r_y0": 163.59699999999998, "r_x1": 353.584, "r_y1": 163.59699999999998, "r_x2": 353.584, "r_y2": 154.79999999999995, "r_x3": 331.727, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "often", "orig": "often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.176, "r_y0": 163.59699999999998, "r_x1": 480.588, "r_y1": 163.59699999999998, "r_x2": 480.588, "r_y2": 154.79999999999995, "r_x3": 358.176, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "implemented with standard", "orig": "implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.593, "r_y1": 175.55200000000002, "r_x2": 480.593, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 480.596, "r_y1": 187.50699999999995, "r_x2": 480.596, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 199.462, "r_x1": 480.593, "r_y1": 199.462, "r_x2": 480.593, "r_y2": 190.66499999999996, "r_x3": 134.765, "r_y3": 190.66499999999996, "coord_origin": "TOPLEFT"}, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 211.41700000000003, "r_x1": 143.065, "r_y1": 211.41700000000003, "r_x2": 143.065, "r_y2": 202.62, "r_x3": 134.765, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.329, "r_y0": 211.41700000000003, "r_x1": 480.594, "r_y1": 211.41700000000003, "r_x2": 480.594, "r_y2": 202.62, "r_x3": 147.329, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "order to obtain the table-structure, which is necessary with OD and GNN", "orig": "order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 223.37300000000005, "r_x1": 480.588, "r_y1": 223.37300000000005, "r_x2": 480.588, "r_y2": 214.57600000000002, "r_x3": 134.765, "r_y3": 214.57600000000002, "coord_origin": "TOPLEFT"}, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.32799999999997, "r_x1": 480.59, "r_y1": 235.32799999999997, "r_x2": 480.59, "r_y2": 226.53099999999995, "r_x3": 134.765, "r_y3": 226.53099999999995, "coord_origin": "TOPLEFT"}, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.28300000000002, "r_x1": 480.596, "r_y1": 247.28300000000002, "r_x2": 480.596, "r_y2": 238.486, "r_x3": 134.765, "r_y3": 238.486, "coord_origin": "TOPLEFT"}, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.23800000000006, "r_x1": 480.595, "r_y1": 259.23800000000006, "r_x2": 480.595, "r_y2": 250.44100000000003, "r_x3": 134.765, "r_y3": 250.44100000000003, "coord_origin": "TOPLEFT"}, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 262.65700000000004, "r": 480.596, "b": 486.647, "coord_origin": "TOPLEFT"}, "confidence": 0.929087221622467, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 271.45399999999995, "r_x1": 199.213, "r_y1": 271.45399999999995, "r_x2": 199.213, "r_y2": 262.65700000000004, "r_x3": 149.709, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "Within the", "orig": "Within the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 204.175, "r_y0": 271.45399999999995, "r_x1": 349.163, "r_y1": 271.45399999999995, "r_x2": 349.163, "r_y2": 262.65700000000004, "r_x3": 204.175, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "Im2Seq method, we find several", "orig": "Im2Seq method, we find several", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.125, "r_y0": 271.45399999999995, "r_x1": 387.632, "r_y1": 271.45399999999995, "r_x2": 387.632, "r_y2": 262.65700000000004, "r_x3": 354.125, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "popular", "orig": "popular", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.593, "r_y0": 271.45399999999995, "r_x1": 425.573, "r_y1": 271.45399999999995, "r_x2": 425.573, "r_y2": 262.65700000000004, "r_x3": 392.593, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "models,", "orig": "models,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.535, "r_y0": 271.45399999999995, "r_x1": 480.593, "r_y1": 271.45399999999995, "r_x2": 480.593, "r_y2": 262.65700000000004, "r_x3": 430.535, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "namely the", "orig": "namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.409, "r_x1": 480.592, "r_y1": 283.409, "r_x2": 480.592, "r_y2": 274.61199999999997, "r_x3": 134.765, "r_y3": 274.61199999999997, "coord_origin": "TOPLEFT"}, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.364, "r_x1": 480.593, "r_y1": 295.364, "r_x2": 480.593, "r_y2": 286.567, "r_x3": 134.765, "r_y3": 286.567, "coord_origin": "TOPLEFT"}, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 307.319, "r_x1": 342.021, "r_y1": 307.319, "r_x2": 342.021, "r_y2": 298.522, "r_x3": 134.765, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.064, "r_y0": 307.319, "r_x1": 393.047, "r_y1": 307.319, "r_x2": 393.047, "r_y2": 298.522, "r_x3": 345.064, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.167, "r_y0": 307.319, "r_x1": 480.591, "r_y1": 307.319, "r_x2": 480.591, "r_y2": 298.522, "r_x3": 397.167, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 319.275, "r_x1": 333.299, "r_y1": 319.275, "r_x2": 333.299, "r_y2": 310.478, "r_x3": 134.765, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.299, "r_y0": 319.275, "r_x1": 356.971, "r_y1": 319.275, "r_x2": 356.971, "r_y2": 310.478, "r_x3": 333.299, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.085, "r_y0": 319.275, "r_x1": 363.725, "r_y1": 319.275, "r_x2": 363.725, "r_y2": 310.478, "r_x3": 357.085, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "),", "orig": "),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.64, "r_y0": 319.275, "r_x1": 480.594, "r_y1": 319.275, "r_x2": 480.594, "r_y2": 310.478, "r_x3": 367.64, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "the attention is passed to", "orig": "the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.23, "r_x1": 148.598, "r_y1": 331.23, "r_x2": 148.598, "r_y2": 322.433, "r_x3": 134.765, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.277, "r_y0": 331.23, "r_x1": 166.531, "r_y1": 331.23, "r_x2": 166.531, "r_y2": 322.433, "r_x3": 152.277, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.427, "r_y0": 331.23, "r_x1": 202.111, "r_y1": 331.23, "r_x2": 202.111, "r_y2": 322.433, "r_x3": 170.427, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "decoder", "orig": "decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.864, "r_y0": 331.23, "r_x1": 480.587, "r_y1": 331.23, "r_x2": 480.587, "r_y2": 322.433, "r_x3": 206.864, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 343.185, "r_x1": 480.595, "r_y1": 343.185, "r_x2": 480.595, "r_y2": 334.388, "r_x3": 134.765, "r_y3": 334.388, "coord_origin": "TOPLEFT"}, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 355.14, "r_x1": 480.587, "r_y1": 355.14, "r_x2": 480.587, "r_y2": 346.343, "r_x3": 134.765, "r_y3": 346.343, "coord_origin": "TOPLEFT"}, "text": "TableFormer address this reliance on OCRand uses two transformer decoders for", "orig": "TableFormer address this reliance on OCRand uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 367.095, "r_x1": 480.589, "r_y1": 367.095, "r_x2": 480.589, "r_y2": 358.298, "r_x3": 134.765, "r_y3": 358.298, "coord_origin": "TOPLEFT"}, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.05, "r_x1": 480.589, "r_y1": 379.05, "r_x2": 480.589, "r_y2": 370.253, "r_x3": 134.765, "r_y3": 370.253, "coord_origin": "TOPLEFT"}, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.006, "r_x1": 480.594, "r_y1": 391.006, "r_x2": 480.594, "r_y2": 382.209, "r_x3": 134.765, "r_y3": 382.209, "coord_origin": "TOPLEFT"}, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 402.961, "r_x1": 480.587, "r_y1": 402.961, "r_x2": 480.587, "r_y2": 394.164, "r_x3": 134.765, "r_y3": 394.164, "coord_origin": "TOPLEFT"}, "text": "[2] proposes a compact double-matrix representation of table rows and columns", "orig": "[2] proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 414.916, "r_x1": 480.596, "r_y1": 414.916, "r_x2": 480.596, "r_y2": 406.119, "r_x3": 134.765, "r_y3": 406.119, "coord_origin": "TOPLEFT"}, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 426.871, "r_x1": 480.592, "r_y1": 426.871, "r_x2": 480.592, "r_y2": 418.074, "r_x3": 134.765, "r_y3": 418.074, "coord_origin": "TOPLEFT"}, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 438.826, "r_x1": 480.588, "r_y1": 438.826, "r_x2": 480.588, "r_y2": 430.029, "r_x3": 134.765, "r_y3": 430.029, "coord_origin": "TOPLEFT"}, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 450.781, "r_x1": 480.589, "r_y1": 450.781, "r_x2": 480.589, "r_y2": 441.984, "r_x3": 134.765, "r_y3": 441.984, "coord_origin": "TOPLEFT"}, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 462.737, "r_x1": 384.575, "r_y1": 462.737, "r_x2": 384.575, "r_y2": 453.94, "r_x3": 134.765, "r_y3": 453.94, "coord_origin": "TOPLEFT"}, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.559, "r_y0": 462.737, "r_x1": 480.588, "r_y1": 462.737, "r_x2": 480.588, "r_y2": 453.94, "r_x3": 391.559, "r_y3": 453.94, "coord_origin": "TOPLEFT"}, "text": "[5] introduces Gated", "orig": "[5] introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 474.692, "r_x1": 480.591, "r_y1": 474.692, "r_x2": 480.591, "r_y2": 465.895, "r_x3": 134.765, "r_y3": 465.895, "coord_origin": "TOPLEFT"}, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 486.647, "r_x1": 203.686, "r_y1": 486.647, "r_x2": 203.686, "r_y2": 477.85, "r_x3": 134.765, "r_y3": 477.85, "coord_origin": "TOPLEFT"}, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 490.066, "r": 480.594, "b": 582.549, "coord_origin": "TOPLEFT"}, "confidence": 0.9853583574295044, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 498.863, "r_x1": 480.594, "r_y1": 498.863, "r_x2": 480.594, "r_y2": 490.066, "r_x3": 149.709, "r_y3": 490.066, "coord_origin": "TOPLEFT"}, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 510.818, "r_x1": 480.589, "r_y1": 510.818, "r_x2": 480.589, "r_y2": 502.021, "r_x3": 134.765, "r_y3": 502.021, "coord_origin": "TOPLEFT"}, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 522.773, "r_x1": 480.587, "r_y1": 522.773, "r_x2": 480.587, "r_y2": 513.976, "r_x3": 134.765, "r_y3": 513.976, "coord_origin": "TOPLEFT"}, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 534.7280000000001, "r_x1": 176.662, "r_y1": 534.7280000000001, "r_x2": 176.662, "r_y2": 525.931, "r_x3": 134.765, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "to deliver", "orig": "to deliver", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.896, "r_y0": 534.7280000000001, "r_x1": 246.551, "r_y1": 534.7280000000001, "r_x2": 246.551, "r_y2": 525.931, "r_x3": 180.896, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art", "orig": "state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.785, "r_y0": 534.7280000000001, "r_x1": 480.59, "r_y1": 534.7280000000001, "r_x2": 480.59, "r_y2": 525.931, "r_x3": 250.785, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "prediction accuracy [9]. This motivated the authors", "orig": "prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 546.683, "r_x1": 143.619, "r_y1": 546.683, "r_x2": 143.619, "r_y2": 537.886, "r_x3": 134.765, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.56, "r_y0": 546.683, "r_x1": 194.815, "r_y1": 546.683, "r_x2": 194.815, "r_y2": 537.886, "r_x3": 148.56, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "investigate", "orig": "investigate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.756, "r_y0": 546.683, "r_x1": 205.566, "r_y1": 546.683, "r_x2": 205.566, "r_y2": 537.886, "r_x3": 199.756, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "if", "orig": "if", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.508, "r_y0": 546.683, "r_x1": 224.341, "r_y1": 546.683, "r_x2": 224.341, "r_y2": 537.886, "r_x3": 210.508, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.272, "r_y0": 546.683, "r_x1": 283.004, "r_y1": 546.683, "r_x2": 283.004, "r_y2": 537.886, "r_x3": 229.272, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "performance", "orig": "performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.945, "r_y0": 546.683, "r_x1": 312.018, "r_y1": 546.683, "r_x2": 312.018, "r_y2": 537.886, "r_x3": 287.945, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "(both", "orig": "(both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.949, "r_y0": 546.683, "r_x1": 325.249, "r_y1": 546.683, "r_x2": 325.249, "r_y2": 537.886, "r_x3": 316.949, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.19, "r_y0": 546.683, "r_x1": 368.122, "r_y1": 546.683, "r_x2": 368.122, "r_y2": 537.886, "r_x3": 330.19, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "accuracy", "orig": "accuracy", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.063, "r_y0": 546.683, "r_x1": 432.535, "r_y1": 546.683, "r_x2": 432.535, "r_y2": 537.886, "r_x3": 373.063, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "and inference", "orig": "and inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.477, "r_y0": 546.683, "r_x1": 460.716, "r_y1": 546.683, "r_x2": 460.716, "r_y2": 537.886, "r_x3": 437.477, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "time)", "orig": "time)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.648, "r_y0": 546.683, "r_x1": 480.588, "r_y1": 546.683, "r_x2": 480.588, "r_y2": 537.886, "r_x3": 465.648, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "can", "orig": "can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 558.639, "r_x1": 480.59, "r_y1": 558.639, "r_x2": 480.59, "r_y2": 549.842, "r_x3": 134.765, "r_y3": 549.842, "coord_origin": "TOPLEFT"}, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 570.594, "r_x1": 183.086, "r_y1": 570.594, "r_x2": 183.086, "r_y2": 561.797, "r_x3": 134.765, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "We believe", "orig": "We believe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.977, "r_y0": 570.594, "r_x1": 204.079, "r_y1": 570.594, "r_x2": 204.079, "r_y2": 561.797, "r_x3": 187.977, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.96, "r_y0": 570.594, "r_x1": 215.655, "r_y1": 570.594, "r_x2": 215.655, "r_y2": 561.797, "r_x3": 208.96, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.547, "r_y0": 570.594, "r_x1": 271.217, "r_y1": 570.594, "r_x2": 271.217, "r_y2": 561.797, "r_x3": 220.547, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "a necessary", "orig": "a necessary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 276.108, "r_y0": 570.594, "r_x1": 293.87, "r_y1": 570.594, "r_x2": 293.87, "r_y2": 561.797, "r_x3": 276.108, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "step", "orig": "step", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.751, "r_y0": 570.594, "r_x1": 325.342, "r_y1": 570.594, "r_x2": 325.342, "r_y2": 561.797, "r_x3": 298.751, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "before", "orig": "before", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.223, "r_y0": 570.594, "r_x1": 360.436, "r_y1": 570.594, "r_x2": 360.436, "r_y2": 561.797, "r_x3": 330.223, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "further", "orig": "further", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.327, "r_y0": 570.594, "r_x1": 409.067, "r_y1": 570.594, "r_x2": 409.067, "r_y2": 561.797, "r_x3": 365.327, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "improving", "orig": "improving", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.949, "r_y0": 570.594, "r_x1": 441.09, "r_y1": 570.594, "r_x2": 441.09, "r_y2": 561.797, "r_x3": 413.949, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "neural", "orig": "neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.982, "r_y0": 570.594, "r_x1": 480.589, "r_y1": 570.594, "r_x2": 480.589, "r_y2": 561.797, "r_x3": 445.982, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 582.549, "r_x1": 249.278, "r_y1": 582.549, "r_x2": 249.278, "r_y2": 573.752, "r_x3": 134.765, "r_y3": 573.752, "coord_origin": "TOPLEFT"}, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 605.55, "r": 269.624, "b": 616.1179999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9393903017044067, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 616.1179999999999, "r_x1": 141.489, "r_y1": 616.1179999999999, "r_x2": 141.489, "r_y2": 605.55, "r_x3": 134.765, "r_y3": 605.55, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 616.1179999999999, "r_x1": 269.624, "r_y1": 616.1179999999999, "r_x2": 269.624, "r_y2": 605.55, "r_x3": 154.938, "r_y3": 605.55, "coord_origin": "TOPLEFT"}, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 632.148, "r": 480.594, "b": 664.856, "coord_origin": "TOPLEFT"}, "confidence": 0.9692807197570801, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.591, "r_y1": 640.9449999999999, "r_x2": 480.591, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.587, "r_y1": 652.9, "r_x2": 480.587, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.856, "r_x1": 480.594, "r_y1": 664.856, "r_x2": 480.594, "r_y2": 656.059, "r_x3": 134.765, "r_y3": 656.059, "coord_origin": "TOPLEFT"}, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 6, "page_no": 3, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.7890051603317261, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4"}, {"label": "page_header", "id": 5, "page_no": 3, "cluster": {"id": 5, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9045588374137878, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}, {"label": "text", "id": 2, "page_no": 3, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.596, "b": 259.23800000000006, "coord_origin": "TOPLEFT"}, "confidence": 0.9467443823814392, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.594, "r_y1": 127.731, "r_x2": 480.594, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.588, "r_y1": 139.68600000000004, "r_x2": 480.588, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.587, "r_y1": 151.64200000000005, "r_x2": 480.587, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 174.162, "r_y1": 163.59699999999998, "r_x2": 174.162, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.755, "r_y0": 163.59699999999998, "r_x1": 240.56, "r_y1": 163.59699999999998, "r_x2": 240.56, "r_y2": 154.79999999999995, "r_x3": 178.755, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "representation", "orig": "representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.143, "r_y0": 163.59699999999998, "r_x1": 286.09, "r_y1": 163.59699999999998, "r_x2": 286.09, "r_y2": 154.79999999999995, "r_x3": 245.143, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "language,", "orig": "language,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 290.683, "r_y0": 163.59699999999998, "r_x1": 327.144, "r_y1": 163.59699999999998, "r_x2": 327.144, "r_y2": 154.79999999999995, "r_x3": 290.683, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "which is", "orig": "which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.727, "r_y0": 163.59699999999998, "r_x1": 353.584, "r_y1": 163.59699999999998, "r_x2": 353.584, "r_y2": 154.79999999999995, "r_x3": 331.727, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "often", "orig": "often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.176, "r_y0": 163.59699999999998, "r_x1": 480.588, "r_y1": 163.59699999999998, "r_x2": 480.588, "r_y2": 154.79999999999995, "r_x3": 358.176, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "implemented with standard", "orig": "implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.593, "r_y1": 175.55200000000002, "r_x2": 480.593, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 480.596, "r_y1": 187.50699999999995, "r_x2": 480.596, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 199.462, "r_x1": 480.593, "r_y1": 199.462, "r_x2": 480.593, "r_y2": 190.66499999999996, "r_x3": 134.765, "r_y3": 190.66499999999996, "coord_origin": "TOPLEFT"}, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 211.41700000000003, "r_x1": 143.065, "r_y1": 211.41700000000003, "r_x2": 143.065, "r_y2": 202.62, "r_x3": 134.765, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.329, "r_y0": 211.41700000000003, "r_x1": 480.594, "r_y1": 211.41700000000003, "r_x2": 480.594, "r_y2": 202.62, "r_x3": 147.329, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "order to obtain the table-structure, which is necessary with OD and GNN", "orig": "order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 223.37300000000005, "r_x1": 480.588, "r_y1": 223.37300000000005, "r_x2": 480.588, "r_y2": 214.57600000000002, "r_x3": 134.765, "r_y3": 214.57600000000002, "coord_origin": "TOPLEFT"}, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.32799999999997, "r_x1": 480.59, "r_y1": 235.32799999999997, "r_x2": 480.59, "r_y2": 226.53099999999995, "r_x3": 134.765, "r_y3": 226.53099999999995, "coord_origin": "TOPLEFT"}, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.28300000000002, "r_x1": 480.596, "r_y1": 247.28300000000002, "r_x2": 480.596, "r_y2": 238.486, "r_x3": 134.765, "r_y3": 238.486, "coord_origin": "TOPLEFT"}, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.23800000000006, "r_x1": 480.595, "r_y1": 259.23800000000006, "r_x2": 480.595, "r_y2": 250.44100000000003, "r_x3": 134.765, "r_y3": 250.44100000000003, "coord_origin": "TOPLEFT"}, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells must be merged using an attention network. Im2Seq methods cast the problem as a sequence generation task [4,5,9,22], and therefore need an internal tablestructure representation language, which is often implemented with standard markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods have a natural advantage over the OD and GNN methods by virtue of directly predicting the table-structure. As such, no post-processing or rules are needed in order to obtain the table-structure, which is necessary with OD and GNN approaches. In practice, this is not entirely true, because a predicted sequence of table-structure markup does not necessarily have to be syntactically correct. Hence, depending on the quality of the predicted sequence, some post-processing needs to be performed to ensure a syntactically valid (let alone correct) sequence."}, {"label": "text", "id": 4, "page_no": 3, "cluster": {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 262.65700000000004, "r": 480.596, "b": 486.647, "coord_origin": "TOPLEFT"}, "confidence": 0.929087221622467, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 271.45399999999995, "r_x1": 199.213, "r_y1": 271.45399999999995, "r_x2": 199.213, "r_y2": 262.65700000000004, "r_x3": 149.709, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "Within the", "orig": "Within the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 204.175, "r_y0": 271.45399999999995, "r_x1": 349.163, "r_y1": 271.45399999999995, "r_x2": 349.163, "r_y2": 262.65700000000004, "r_x3": 204.175, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "Im2Seq method, we find several", "orig": "Im2Seq method, we find several", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.125, "r_y0": 271.45399999999995, "r_x1": 387.632, "r_y1": 271.45399999999995, "r_x2": 387.632, "r_y2": 262.65700000000004, "r_x3": 354.125, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "popular", "orig": "popular", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.593, "r_y0": 271.45399999999995, "r_x1": 425.573, "r_y1": 271.45399999999995, "r_x2": 425.573, "r_y2": 262.65700000000004, "r_x3": 392.593, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "models,", "orig": "models,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.535, "r_y0": 271.45399999999995, "r_x1": 480.593, "r_y1": 271.45399999999995, "r_x2": 480.593, "r_y2": 262.65700000000004, "r_x3": 430.535, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "namely the", "orig": "namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.409, "r_x1": 480.592, "r_y1": 283.409, "r_x2": 480.592, "r_y2": 274.61199999999997, "r_x3": 134.765, "r_y3": 274.61199999999997, "coord_origin": "TOPLEFT"}, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.364, "r_x1": 480.593, "r_y1": 295.364, "r_x2": 480.593, "r_y2": 286.567, "r_x3": 134.765, "r_y3": 286.567, "coord_origin": "TOPLEFT"}, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 307.319, "r_x1": 342.021, "r_y1": 307.319, "r_x2": 342.021, "r_y2": 298.522, "r_x3": 134.765, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.064, "r_y0": 307.319, "r_x1": 393.047, "r_y1": 307.319, "r_x2": 393.047, "r_y2": 298.522, "r_x3": 345.064, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.167, "r_y0": 307.319, "r_x1": 480.591, "r_y1": 307.319, "r_x2": 480.591, "r_y2": 298.522, "r_x3": 397.167, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 319.275, "r_x1": 333.299, "r_y1": 319.275, "r_x2": 333.299, "r_y2": 310.478, "r_x3": 134.765, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.299, "r_y0": 319.275, "r_x1": 356.971, "r_y1": 319.275, "r_x2": 356.971, "r_y2": 310.478, "r_x3": 333.299, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.085, "r_y0": 319.275, "r_x1": 363.725, "r_y1": 319.275, "r_x2": 363.725, "r_y2": 310.478, "r_x3": 357.085, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "),", "orig": "),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.64, "r_y0": 319.275, "r_x1": 480.594, "r_y1": 319.275, "r_x2": 480.594, "r_y2": 310.478, "r_x3": 367.64, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "the attention is passed to", "orig": "the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.23, "r_x1": 148.598, "r_y1": 331.23, "r_x2": 148.598, "r_y2": 322.433, "r_x3": 134.765, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.277, "r_y0": 331.23, "r_x1": 166.531, "r_y1": 331.23, "r_x2": 166.531, "r_y2": 322.433, "r_x3": 152.277, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.427, "r_y0": 331.23, "r_x1": 202.111, "r_y1": 331.23, "r_x2": 202.111, "r_y2": 322.433, "r_x3": 170.427, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "decoder", "orig": "decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.864, "r_y0": 331.23, "r_x1": 480.587, "r_y1": 331.23, "r_x2": 480.587, "r_y2": 322.433, "r_x3": 206.864, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 343.185, "r_x1": 480.595, "r_y1": 343.185, "r_x2": 480.595, "r_y2": 334.388, "r_x3": 134.765, "r_y3": 334.388, "coord_origin": "TOPLEFT"}, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 355.14, "r_x1": 480.587, "r_y1": 355.14, "r_x2": 480.587, "r_y2": 346.343, "r_x3": 134.765, "r_y3": 346.343, "coord_origin": "TOPLEFT"}, "text": "TableFormer address this reliance on OCRand uses two transformer decoders for", "orig": "TableFormer address this reliance on OCRand uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 367.095, "r_x1": 480.589, "r_y1": 367.095, "r_x2": 480.589, "r_y2": 358.298, "r_x3": 134.765, "r_y3": 358.298, "coord_origin": "TOPLEFT"}, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.05, "r_x1": 480.589, "r_y1": 379.05, "r_x2": 480.589, "r_y2": 370.253, "r_x3": 134.765, "r_y3": 370.253, "coord_origin": "TOPLEFT"}, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.006, "r_x1": 480.594, "r_y1": 391.006, "r_x2": 480.594, "r_y2": 382.209, "r_x3": 134.765, "r_y3": 382.209, "coord_origin": "TOPLEFT"}, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 402.961, "r_x1": 480.587, "r_y1": 402.961, "r_x2": 480.587, "r_y2": 394.164, "r_x3": 134.765, "r_y3": 394.164, "coord_origin": "TOPLEFT"}, "text": "[2] proposes a compact double-matrix representation of table rows and columns", "orig": "[2] proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 414.916, "r_x1": 480.596, "r_y1": 414.916, "r_x2": 480.596, "r_y2": 406.119, "r_x3": 134.765, "r_y3": 406.119, "coord_origin": "TOPLEFT"}, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 426.871, "r_x1": 480.592, "r_y1": 426.871, "r_x2": 480.592, "r_y2": 418.074, "r_x3": 134.765, "r_y3": 418.074, "coord_origin": "TOPLEFT"}, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 438.826, "r_x1": 480.588, "r_y1": 438.826, "r_x2": 480.588, "r_y2": 430.029, "r_x3": 134.765, "r_y3": 430.029, "coord_origin": "TOPLEFT"}, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 450.781, "r_x1": 480.589, "r_y1": 450.781, "r_x2": 480.589, "r_y2": 441.984, "r_x3": 134.765, "r_y3": 441.984, "coord_origin": "TOPLEFT"}, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 462.737, "r_x1": 384.575, "r_y1": 462.737, "r_x2": 384.575, "r_y2": 453.94, "r_x3": 134.765, "r_y3": 453.94, "coord_origin": "TOPLEFT"}, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.559, "r_y0": 462.737, "r_x1": 480.588, "r_y1": 462.737, "r_x2": 480.588, "r_y2": 453.94, "r_x3": 391.559, "r_y3": 453.94, "coord_origin": "TOPLEFT"}, "text": "[5] introduces Gated", "orig": "[5] introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 474.692, "r_x1": 480.591, "r_y1": 474.692, "r_x2": 480.591, "r_y2": 465.895, "r_x3": 134.765, "r_y3": 465.895, "coord_origin": "TOPLEFT"}, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 486.647, "r_x1": 203.686, "r_y1": 486.647, "r_x2": 203.686, "r_y2": 477.85, "r_x3": 134.765, "r_y3": 477.85, "coord_origin": "TOPLEFT"}, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Within the Im2Seq method, we find several popular models, namely the encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders to predict a table in HTML representation. The tag decoder predicts a sequence of HTML tags. For each decoded table cell ( <td> ), the attention is passed to the cell decoder to predict the content with an embedded OCR approach. The latter makes it susceptible to transcription errors in the cell content of the table. TableFormer address this reliance on OCRand uses two transformer decoders for HTML structure and cell bounding box prediction in an end-to-end architecture. The predicted cell bounding box is then used to extract text tokens from an originating (digital) PDF page, circumventing any need for OCR. TabSplitter [2] proposes a compact double-matrix representation of table rows and columns to do error detection and error correction of HTML structure sequences based on predictions from [19]. This compact double-matrix representation can not be used directly by the Img2seq model training, so the model uses HTML as an intermediate form. Chi et. al. [4] introduce a data set and a baseline method using bidirectional LSTMs to predict LaTeX code. Kayal [5] introduces Gated ResNet transformers to predict LaTeX code, and a separate OCR module to extract content."}, {"label": "text", "id": 0, "page_no": 3, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 490.066, "r": 480.594, "b": 582.549, "coord_origin": "TOPLEFT"}, "confidence": 0.9853583574295044, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 498.863, "r_x1": 480.594, "r_y1": 498.863, "r_x2": 480.594, "r_y2": 490.066, "r_x3": 149.709, "r_y3": 490.066, "coord_origin": "TOPLEFT"}, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 510.818, "r_x1": 480.589, "r_y1": 510.818, "r_x2": 480.589, "r_y2": 502.021, "r_x3": 134.765, "r_y3": 502.021, "coord_origin": "TOPLEFT"}, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 522.773, "r_x1": 480.587, "r_y1": 522.773, "r_x2": 480.587, "r_y2": 513.976, "r_x3": 134.765, "r_y3": 513.976, "coord_origin": "TOPLEFT"}, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 534.7280000000001, "r_x1": 176.662, "r_y1": 534.7280000000001, "r_x2": 176.662, "r_y2": 525.931, "r_x3": 134.765, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "to deliver", "orig": "to deliver", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.896, "r_y0": 534.7280000000001, "r_x1": 246.551, "r_y1": 534.7280000000001, "r_x2": 246.551, "r_y2": 525.931, "r_x3": 180.896, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art", "orig": "state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.785, "r_y0": 534.7280000000001, "r_x1": 480.59, "r_y1": 534.7280000000001, "r_x2": 480.59, "r_y2": 525.931, "r_x3": 250.785, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "prediction accuracy [9]. This motivated the authors", "orig": "prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 546.683, "r_x1": 143.619, "r_y1": 546.683, "r_x2": 143.619, "r_y2": 537.886, "r_x3": 134.765, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.56, "r_y0": 546.683, "r_x1": 194.815, "r_y1": 546.683, "r_x2": 194.815, "r_y2": 537.886, "r_x3": 148.56, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "investigate", "orig": "investigate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.756, "r_y0": 546.683, "r_x1": 205.566, "r_y1": 546.683, "r_x2": 205.566, "r_y2": 537.886, "r_x3": 199.756, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "if", "orig": "if", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.508, "r_y0": 546.683, "r_x1": 224.341, "r_y1": 546.683, "r_x2": 224.341, "r_y2": 537.886, "r_x3": 210.508, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.272, "r_y0": 546.683, "r_x1": 283.004, "r_y1": 546.683, "r_x2": 283.004, "r_y2": 537.886, "r_x3": 229.272, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "performance", "orig": "performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.945, "r_y0": 546.683, "r_x1": 312.018, "r_y1": 546.683, "r_x2": 312.018, "r_y2": 537.886, "r_x3": 287.945, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "(both", "orig": "(both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.949, "r_y0": 546.683, "r_x1": 325.249, "r_y1": 546.683, "r_x2": 325.249, "r_y2": 537.886, "r_x3": 316.949, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.19, "r_y0": 546.683, "r_x1": 368.122, "r_y1": 546.683, "r_x2": 368.122, "r_y2": 537.886, "r_x3": 330.19, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "accuracy", "orig": "accuracy", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.063, "r_y0": 546.683, "r_x1": 432.535, "r_y1": 546.683, "r_x2": 432.535, "r_y2": 537.886, "r_x3": 373.063, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "and inference", "orig": "and inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.477, "r_y0": 546.683, "r_x1": 460.716, "r_y1": 546.683, "r_x2": 460.716, "r_y2": 537.886, "r_x3": 437.477, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "time)", "orig": "time)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.648, "r_y0": 546.683, "r_x1": 480.588, "r_y1": 546.683, "r_x2": 480.588, "r_y2": 537.886, "r_x3": 465.648, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "can", "orig": "can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 558.639, "r_x1": 480.59, "r_y1": 558.639, "r_x2": 480.59, "r_y2": 549.842, "r_x3": 134.765, "r_y3": 549.842, "coord_origin": "TOPLEFT"}, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 570.594, "r_x1": 183.086, "r_y1": 570.594, "r_x2": 183.086, "r_y2": 561.797, "r_x3": 134.765, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "We believe", "orig": "We believe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.977, "r_y0": 570.594, "r_x1": 204.079, "r_y1": 570.594, "r_x2": 204.079, "r_y2": 561.797, "r_x3": 187.977, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.96, "r_y0": 570.594, "r_x1": 215.655, "r_y1": 570.594, "r_x2": 215.655, "r_y2": 561.797, "r_x3": 208.96, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.547, "r_y0": 570.594, "r_x1": 271.217, "r_y1": 570.594, "r_x2": 271.217, "r_y2": 561.797, "r_x3": 220.547, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "a necessary", "orig": "a necessary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 276.108, "r_y0": 570.594, "r_x1": 293.87, "r_y1": 570.594, "r_x2": 293.87, "r_y2": 561.797, "r_x3": 276.108, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "step", "orig": "step", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.751, "r_y0": 570.594, "r_x1": 325.342, "r_y1": 570.594, "r_x2": 325.342, "r_y2": 561.797, "r_x3": 298.751, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "before", "orig": "before", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.223, "r_y0": 570.594, "r_x1": 360.436, "r_y1": 570.594, "r_x2": 360.436, "r_y2": 561.797, "r_x3": 330.223, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "further", "orig": "further", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.327, "r_y0": 570.594, "r_x1": 409.067, "r_y1": 570.594, "r_x2": 409.067, "r_y2": 561.797, "r_x3": 365.327, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "improving", "orig": "improving", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.949, "r_y0": 570.594, "r_x1": 441.09, "r_y1": 570.594, "r_x2": 441.09, "r_y2": 561.797, "r_x3": 413.949, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "neural", "orig": "neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.982, "r_y0": 570.594, "r_x1": 480.589, "r_y1": 570.594, "r_x2": 480.589, "r_y2": 561.797, "r_x3": 445.982, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 582.549, "r_x1": 249.278, "r_y1": 582.549, "r_x2": 249.278, "r_y2": 573.752, "r_x3": 134.765, "r_y3": 573.752, "coord_origin": "TOPLEFT"}, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a full end-to-end network design that can output the final table structure without pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated to deliver state-of-the-art prediction accuracy [9]. This motivated the authors to investigate if the performance (both in accuracy and inference time) can be further improved by optimising the table structure representation language. We believe this is a necessary step before further improving neural network architectures for this task."}, {"label": "section_header", "id": 3, "page_no": 3, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 605.55, "r": 269.624, "b": 616.1179999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9393903017044067, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 616.1179999999999, "r_x1": 141.489, "r_y1": 616.1179999999999, "r_x2": 141.489, "r_y2": 605.55, "r_x3": 134.765, "r_y3": 605.55, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 616.1179999999999, "r_x1": 269.624, "r_y1": 616.1179999999999, "r_x2": 269.624, "r_y2": 605.55, "r_x3": 154.938, "r_y3": 605.55, "coord_origin": "TOPLEFT"}, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3 Problem Statement"}, {"label": "text", "id": 1, "page_no": 3, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 632.148, "r": 480.594, "b": 664.856, "coord_origin": "TOPLEFT"}, "confidence": 0.9692807197570801, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.591, "r_y1": 640.9449999999999, "r_x2": 480.591, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.587, "r_y1": 652.9, "r_x2": 480.587, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.856, "r_x1": 480.594, "r_y1": 664.856, "r_x2": 480.594, "r_y2": 656.059, "r_x3": 134.765, "r_y3": 656.059, "coord_origin": "TOPLEFT"}, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways. Given an image of a table, the Im2Seq model predicts the structure of the table by generating a sequence of tokens. These tokens originate from a finite vocab-"}], "body": [{"label": "text", "id": 2, "page_no": 3, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.596, "b": 259.23800000000006, "coord_origin": "TOPLEFT"}, "confidence": 0.9467443823814392, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.594, "r_y1": 127.731, "r_x2": 480.594, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.588, "r_y1": 139.68600000000004, "r_x2": 480.588, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.587, "r_y1": 151.64200000000005, "r_x2": 480.587, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 174.162, "r_y1": 163.59699999999998, "r_x2": 174.162, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.755, "r_y0": 163.59699999999998, "r_x1": 240.56, "r_y1": 163.59699999999998, "r_x2": 240.56, "r_y2": 154.79999999999995, "r_x3": 178.755, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "representation", "orig": "representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.143, "r_y0": 163.59699999999998, "r_x1": 286.09, "r_y1": 163.59699999999998, "r_x2": 286.09, "r_y2": 154.79999999999995, "r_x3": 245.143, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "language,", "orig": "language,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 290.683, "r_y0": 163.59699999999998, "r_x1": 327.144, "r_y1": 163.59699999999998, "r_x2": 327.144, "r_y2": 154.79999999999995, "r_x3": 290.683, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "which is", "orig": "which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.727, "r_y0": 163.59699999999998, "r_x1": 353.584, "r_y1": 163.59699999999998, "r_x2": 353.584, "r_y2": 154.79999999999995, "r_x3": 331.727, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "often", "orig": "often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.176, "r_y0": 163.59699999999998, "r_x1": 480.588, "r_y1": 163.59699999999998, "r_x2": 480.588, "r_y2": 154.79999999999995, "r_x3": 358.176, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "implemented with standard", "orig": "implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.593, "r_y1": 175.55200000000002, "r_x2": 480.593, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 480.596, "r_y1": 187.50699999999995, "r_x2": 480.596, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 199.462, "r_x1": 480.593, "r_y1": 199.462, "r_x2": 480.593, "r_y2": 190.66499999999996, "r_x3": 134.765, "r_y3": 190.66499999999996, "coord_origin": "TOPLEFT"}, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 211.41700000000003, "r_x1": 143.065, "r_y1": 211.41700000000003, "r_x2": 143.065, "r_y2": 202.62, "r_x3": 134.765, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.329, "r_y0": 211.41700000000003, "r_x1": 480.594, "r_y1": 211.41700000000003, "r_x2": 480.594, "r_y2": 202.62, "r_x3": 147.329, "r_y3": 202.62, "coord_origin": "TOPLEFT"}, "text": "order to obtain the table-structure, which is necessary with OD and GNN", "orig": "order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 223.37300000000005, "r_x1": 480.588, "r_y1": 223.37300000000005, "r_x2": 480.588, "r_y2": 214.57600000000002, "r_x3": 134.765, "r_y3": 214.57600000000002, "coord_origin": "TOPLEFT"}, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.32799999999997, "r_x1": 480.59, "r_y1": 235.32799999999997, "r_x2": 480.59, "r_y2": 226.53099999999995, "r_x3": 134.765, "r_y3": 226.53099999999995, "coord_origin": "TOPLEFT"}, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.28300000000002, "r_x1": 480.596, "r_y1": 247.28300000000002, "r_x2": 480.596, "r_y2": 238.486, "r_x3": 134.765, "r_y3": 238.486, "coord_origin": "TOPLEFT"}, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.23800000000006, "r_x1": 480.595, "r_y1": 259.23800000000006, "r_x2": 480.595, "r_y2": 250.44100000000003, "r_x3": 134.765, "r_y3": 250.44100000000003, "coord_origin": "TOPLEFT"}, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells must be merged using an attention network. Im2Seq methods cast the problem as a sequence generation task [4,5,9,22], and therefore need an internal tablestructure representation language, which is often implemented with standard markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods have a natural advantage over the OD and GNN methods by virtue of directly predicting the table-structure. As such, no post-processing or rules are needed in order to obtain the table-structure, which is necessary with OD and GNN approaches. In practice, this is not entirely true, because a predicted sequence of table-structure markup does not necessarily have to be syntactically correct. Hence, depending on the quality of the predicted sequence, some post-processing needs to be performed to ensure a syntactically valid (let alone correct) sequence."}, {"label": "text", "id": 4, "page_no": 3, "cluster": {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 262.65700000000004, "r": 480.596, "b": 486.647, "coord_origin": "TOPLEFT"}, "confidence": 0.929087221622467, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 271.45399999999995, "r_x1": 199.213, "r_y1": 271.45399999999995, "r_x2": 199.213, "r_y2": 262.65700000000004, "r_x3": 149.709, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "Within the", "orig": "Within the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 204.175, "r_y0": 271.45399999999995, "r_x1": 349.163, "r_y1": 271.45399999999995, "r_x2": 349.163, "r_y2": 262.65700000000004, "r_x3": 204.175, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "Im2Seq method, we find several", "orig": "Im2Seq method, we find several", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.125, "r_y0": 271.45399999999995, "r_x1": 387.632, "r_y1": 271.45399999999995, "r_x2": 387.632, "r_y2": 262.65700000000004, "r_x3": 354.125, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "popular", "orig": "popular", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.593, "r_y0": 271.45399999999995, "r_x1": 425.573, "r_y1": 271.45399999999995, "r_x2": 425.573, "r_y2": 262.65700000000004, "r_x3": 392.593, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "models,", "orig": "models,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.535, "r_y0": 271.45399999999995, "r_x1": 480.593, "r_y1": 271.45399999999995, "r_x2": 480.593, "r_y2": 262.65700000000004, "r_x3": 430.535, "r_y3": 262.65700000000004, "coord_origin": "TOPLEFT"}, "text": "namely the", "orig": "namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.409, "r_x1": 480.592, "r_y1": 283.409, "r_x2": 480.592, "r_y2": 274.61199999999997, "r_x3": 134.765, "r_y3": 274.61199999999997, "coord_origin": "TOPLEFT"}, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.364, "r_x1": 480.593, "r_y1": 295.364, "r_x2": 480.593, "r_y2": 286.567, "r_x3": 134.765, "r_y3": 286.567, "coord_origin": "TOPLEFT"}, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 307.319, "r_x1": 342.021, "r_y1": 307.319, "r_x2": 342.021, "r_y2": 298.522, "r_x3": 134.765, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.064, "r_y0": 307.319, "r_x1": 393.047, "r_y1": 307.319, "r_x2": 393.047, "r_y2": 298.522, "r_x3": 345.064, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.167, "r_y0": 307.319, "r_x1": 480.591, "r_y1": 307.319, "r_x2": 480.591, "r_y2": 298.522, "r_x3": 397.167, "r_y3": 298.522, "coord_origin": "TOPLEFT"}, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 319.275, "r_x1": 333.299, "r_y1": 319.275, "r_x2": 333.299, "r_y2": 310.478, "r_x3": 134.765, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.299, "r_y0": 319.275, "r_x1": 356.971, "r_y1": 319.275, "r_x2": 356.971, "r_y2": 310.478, "r_x3": 333.299, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.085, "r_y0": 319.275, "r_x1": 363.725, "r_y1": 319.275, "r_x2": 363.725, "r_y2": 310.478, "r_x3": 357.085, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "),", "orig": "),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.64, "r_y0": 319.275, "r_x1": 480.594, "r_y1": 319.275, "r_x2": 480.594, "r_y2": 310.478, "r_x3": 367.64, "r_y3": 310.478, "coord_origin": "TOPLEFT"}, "text": "the attention is passed to", "orig": "the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.23, "r_x1": 148.598, "r_y1": 331.23, "r_x2": 148.598, "r_y2": 322.433, "r_x3": 134.765, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.277, "r_y0": 331.23, "r_x1": 166.531, "r_y1": 331.23, "r_x2": 166.531, "r_y2": 322.433, "r_x3": 152.277, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.427, "r_y0": 331.23, "r_x1": 202.111, "r_y1": 331.23, "r_x2": 202.111, "r_y2": 322.433, "r_x3": 170.427, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "decoder", "orig": "decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.864, "r_y0": 331.23, "r_x1": 480.587, "r_y1": 331.23, "r_x2": 480.587, "r_y2": 322.433, "r_x3": 206.864, "r_y3": 322.433, "coord_origin": "TOPLEFT"}, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 343.185, "r_x1": 480.595, "r_y1": 343.185, "r_x2": 480.595, "r_y2": 334.388, "r_x3": 134.765, "r_y3": 334.388, "coord_origin": "TOPLEFT"}, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 355.14, "r_x1": 480.587, "r_y1": 355.14, "r_x2": 480.587, "r_y2": 346.343, "r_x3": 134.765, "r_y3": 346.343, "coord_origin": "TOPLEFT"}, "text": "TableFormer address this reliance on OCRand uses two transformer decoders for", "orig": "TableFormer address this reliance on OCRand uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 367.095, "r_x1": 480.589, "r_y1": 367.095, "r_x2": 480.589, "r_y2": 358.298, "r_x3": 134.765, "r_y3": 358.298, "coord_origin": "TOPLEFT"}, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.05, "r_x1": 480.589, "r_y1": 379.05, "r_x2": 480.589, "r_y2": 370.253, "r_x3": 134.765, "r_y3": 370.253, "coord_origin": "TOPLEFT"}, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.006, "r_x1": 480.594, "r_y1": 391.006, "r_x2": 480.594, "r_y2": 382.209, "r_x3": 134.765, "r_y3": 382.209, "coord_origin": "TOPLEFT"}, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 402.961, "r_x1": 480.587, "r_y1": 402.961, "r_x2": 480.587, "r_y2": 394.164, "r_x3": 134.765, "r_y3": 394.164, "coord_origin": "TOPLEFT"}, "text": "[2] proposes a compact double-matrix representation of table rows and columns", "orig": "[2] proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 414.916, "r_x1": 480.596, "r_y1": 414.916, "r_x2": 480.596, "r_y2": 406.119, "r_x3": 134.765, "r_y3": 406.119, "coord_origin": "TOPLEFT"}, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 426.871, "r_x1": 480.592, "r_y1": 426.871, "r_x2": 480.592, "r_y2": 418.074, "r_x3": 134.765, "r_y3": 418.074, "coord_origin": "TOPLEFT"}, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 438.826, "r_x1": 480.588, "r_y1": 438.826, "r_x2": 480.588, "r_y2": 430.029, "r_x3": 134.765, "r_y3": 430.029, "coord_origin": "TOPLEFT"}, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 450.781, "r_x1": 480.589, "r_y1": 450.781, "r_x2": 480.589, "r_y2": 441.984, "r_x3": 134.765, "r_y3": 441.984, "coord_origin": "TOPLEFT"}, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 462.737, "r_x1": 384.575, "r_y1": 462.737, "r_x2": 384.575, "r_y2": 453.94, "r_x3": 134.765, "r_y3": 453.94, "coord_origin": "TOPLEFT"}, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.559, "r_y0": 462.737, "r_x1": 480.588, "r_y1": 462.737, "r_x2": 480.588, "r_y2": 453.94, "r_x3": 391.559, "r_y3": 453.94, "coord_origin": "TOPLEFT"}, "text": "[5] introduces Gated", "orig": "[5] introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 474.692, "r_x1": 480.591, "r_y1": 474.692, "r_x2": 480.591, "r_y2": 465.895, "r_x3": 134.765, "r_y3": 465.895, "coord_origin": "TOPLEFT"}, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 486.647, "r_x1": 203.686, "r_y1": 486.647, "r_x2": 203.686, "r_y2": 477.85, "r_x3": 134.765, "r_y3": 477.85, "coord_origin": "TOPLEFT"}, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Within the Im2Seq method, we find several popular models, namely the encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders to predict a table in HTML representation. The tag decoder predicts a sequence of HTML tags. For each decoded table cell ( <td> ), the attention is passed to the cell decoder to predict the content with an embedded OCR approach. The latter makes it susceptible to transcription errors in the cell content of the table. TableFormer address this reliance on OCRand uses two transformer decoders for HTML structure and cell bounding box prediction in an end-to-end architecture. The predicted cell bounding box is then used to extract text tokens from an originating (digital) PDF page, circumventing any need for OCR. TabSplitter [2] proposes a compact double-matrix representation of table rows and columns to do error detection and error correction of HTML structure sequences based on predictions from [19]. This compact double-matrix representation can not be used directly by the Img2seq model training, so the model uses HTML as an intermediate form. Chi et. al. [4] introduce a data set and a baseline method using bidirectional LSTMs to predict LaTeX code. Kayal [5] introduces Gated ResNet transformers to predict LaTeX code, and a separate OCR module to extract content."}, {"label": "text", "id": 0, "page_no": 3, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 490.066, "r": 480.594, "b": 582.549, "coord_origin": "TOPLEFT"}, "confidence": 0.9853583574295044, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 498.863, "r_x1": 480.594, "r_y1": 498.863, "r_x2": 480.594, "r_y2": 490.066, "r_x3": 149.709, "r_y3": 490.066, "coord_origin": "TOPLEFT"}, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 510.818, "r_x1": 480.589, "r_y1": 510.818, "r_x2": 480.589, "r_y2": 502.021, "r_x3": 134.765, "r_y3": 502.021, "coord_origin": "TOPLEFT"}, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 522.773, "r_x1": 480.587, "r_y1": 522.773, "r_x2": 480.587, "r_y2": 513.976, "r_x3": 134.765, "r_y3": 513.976, "coord_origin": "TOPLEFT"}, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 534.7280000000001, "r_x1": 176.662, "r_y1": 534.7280000000001, "r_x2": 176.662, "r_y2": 525.931, "r_x3": 134.765, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "to deliver", "orig": "to deliver", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.896, "r_y0": 534.7280000000001, "r_x1": 246.551, "r_y1": 534.7280000000001, "r_x2": 246.551, "r_y2": 525.931, "r_x3": 180.896, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art", "orig": "state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.785, "r_y0": 534.7280000000001, "r_x1": 480.59, "r_y1": 534.7280000000001, "r_x2": 480.59, "r_y2": 525.931, "r_x3": 250.785, "r_y3": 525.931, "coord_origin": "TOPLEFT"}, "text": "prediction accuracy [9]. This motivated the authors", "orig": "prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 546.683, "r_x1": 143.619, "r_y1": 546.683, "r_x2": 143.619, "r_y2": 537.886, "r_x3": 134.765, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.56, "r_y0": 546.683, "r_x1": 194.815, "r_y1": 546.683, "r_x2": 194.815, "r_y2": 537.886, "r_x3": 148.56, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "investigate", "orig": "investigate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.756, "r_y0": 546.683, "r_x1": 205.566, "r_y1": 546.683, "r_x2": 205.566, "r_y2": 537.886, "r_x3": 199.756, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "if", "orig": "if", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.508, "r_y0": 546.683, "r_x1": 224.341, "r_y1": 546.683, "r_x2": 224.341, "r_y2": 537.886, "r_x3": 210.508, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.272, "r_y0": 546.683, "r_x1": 283.004, "r_y1": 546.683, "r_x2": 283.004, "r_y2": 537.886, "r_x3": 229.272, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "performance", "orig": "performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.945, "r_y0": 546.683, "r_x1": 312.018, "r_y1": 546.683, "r_x2": 312.018, "r_y2": 537.886, "r_x3": 287.945, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "(both", "orig": "(both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.949, "r_y0": 546.683, "r_x1": 325.249, "r_y1": 546.683, "r_x2": 325.249, "r_y2": 537.886, "r_x3": 316.949, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.19, "r_y0": 546.683, "r_x1": 368.122, "r_y1": 546.683, "r_x2": 368.122, "r_y2": 537.886, "r_x3": 330.19, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "accuracy", "orig": "accuracy", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.063, "r_y0": 546.683, "r_x1": 432.535, "r_y1": 546.683, "r_x2": 432.535, "r_y2": 537.886, "r_x3": 373.063, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "and inference", "orig": "and inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.477, "r_y0": 546.683, "r_x1": 460.716, "r_y1": 546.683, "r_x2": 460.716, "r_y2": 537.886, "r_x3": 437.477, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "time)", "orig": "time)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.648, "r_y0": 546.683, "r_x1": 480.588, "r_y1": 546.683, "r_x2": 480.588, "r_y2": 537.886, "r_x3": 465.648, "r_y3": 537.886, "coord_origin": "TOPLEFT"}, "text": "can", "orig": "can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 558.639, "r_x1": 480.59, "r_y1": 558.639, "r_x2": 480.59, "r_y2": 549.842, "r_x3": 134.765, "r_y3": 549.842, "coord_origin": "TOPLEFT"}, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 570.594, "r_x1": 183.086, "r_y1": 570.594, "r_x2": 183.086, "r_y2": 561.797, "r_x3": 134.765, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "We believe", "orig": "We believe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.977, "r_y0": 570.594, "r_x1": 204.079, "r_y1": 570.594, "r_x2": 204.079, "r_y2": 561.797, "r_x3": 187.977, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.96, "r_y0": 570.594, "r_x1": 215.655, "r_y1": 570.594, "r_x2": 215.655, "r_y2": 561.797, "r_x3": 208.96, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.547, "r_y0": 570.594, "r_x1": 271.217, "r_y1": 570.594, "r_x2": 271.217, "r_y2": 561.797, "r_x3": 220.547, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "a necessary", "orig": "a necessary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 276.108, "r_y0": 570.594, "r_x1": 293.87, "r_y1": 570.594, "r_x2": 293.87, "r_y2": 561.797, "r_x3": 276.108, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "step", "orig": "step", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 298.751, "r_y0": 570.594, "r_x1": 325.342, "r_y1": 570.594, "r_x2": 325.342, "r_y2": 561.797, "r_x3": 298.751, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "before", "orig": "before", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.223, "r_y0": 570.594, "r_x1": 360.436, "r_y1": 570.594, "r_x2": 360.436, "r_y2": 561.797, "r_x3": 330.223, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "further", "orig": "further", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.327, "r_y0": 570.594, "r_x1": 409.067, "r_y1": 570.594, "r_x2": 409.067, "r_y2": 561.797, "r_x3": 365.327, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "improving", "orig": "improving", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.949, "r_y0": 570.594, "r_x1": 441.09, "r_y1": 570.594, "r_x2": 441.09, "r_y2": 561.797, "r_x3": 413.949, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "neural", "orig": "neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.982, "r_y0": 570.594, "r_x1": 480.589, "r_y1": 570.594, "r_x2": 480.589, "r_y2": 561.797, "r_x3": 445.982, "r_y3": 561.797, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 582.549, "r_x1": 249.278, "r_y1": 582.549, "r_x2": 249.278, "r_y2": 573.752, "r_x3": 134.765, "r_y3": 573.752, "coord_origin": "TOPLEFT"}, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a full end-to-end network design that can output the final table structure without pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated to deliver state-of-the-art prediction accuracy [9]. This motivated the authors to investigate if the performance (both in accuracy and inference time) can be further improved by optimising the table structure representation language. We believe this is a necessary step before further improving neural network architectures for this task."}, {"label": "section_header", "id": 3, "page_no": 3, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 605.55, "r": 269.624, "b": 616.1179999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9393903017044067, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 616.1179999999999, "r_x1": 141.489, "r_y1": 616.1179999999999, "r_x2": 141.489, "r_y2": 605.55, "r_x3": 134.765, "r_y3": 605.55, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 616.1179999999999, "r_x1": 269.624, "r_y1": 616.1179999999999, "r_x2": 269.624, "r_y2": 605.55, "r_x3": 154.938, "r_y3": 605.55, "coord_origin": "TOPLEFT"}, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3 Problem Statement"}, {"label": "text", "id": 1, "page_no": 3, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 632.148, "r": 480.594, "b": 664.856, "coord_origin": "TOPLEFT"}, "confidence": 0.9692807197570801, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.591, "r_y1": 640.9449999999999, "r_x2": 480.591, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.587, "r_y1": 652.9, "r_x2": 480.587, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.856, "r_x1": 480.594, "r_y1": 664.856, "r_x2": 480.594, "r_y2": 656.059, "r_x3": 134.765, "r_y3": 656.059, "coord_origin": "TOPLEFT"}, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways. Given an image of a table, the Im2Seq model predicts the structure of the table by generating a sequence of tokens. These tokens originate from a finite vocab-"}], "headers": [{"label": "page_header", "id": 6, "page_no": 3, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.7890051603317261, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4"}, {"label": "page_header", "id": 5, "page_no": 3, "cluster": {"id": 5, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9045588374137878, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}]}}, {"page_no": 4, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.586, "r_y1": 127.731, "r_x2": 480.586, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 162.485, "r_y1": 139.68600000000004, "r_x2": 162.485, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.368, "r_y0": 139.68600000000004, "r_x1": 201.749, "r_y1": 139.68600000000004, "r_x2": 201.749, "r_y2": 130.889, "r_x3": 166.368, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 201.749, "r_y0": 139.68600000000004, "r_x1": 204.516, "r_y1": 139.68600000000004, "r_x2": 204.516, "r_y2": 130.889, "r_x3": 201.749, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.397, "r_y0": 139.68600000000004, "r_x1": 248.869, "r_y1": 139.68600000000004, "r_x2": 248.869, "r_y2": 130.889, "r_x3": 208.397, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.869, "r_y0": 139.68600000000004, "r_x1": 251.636, "r_y1": 139.68600000000004, "r_x2": 251.636, "r_y2": 130.889, "r_x3": 248.869, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.517, "r_y0": 139.68600000000004, "r_x1": 278.298, "r_y1": 139.68600000000004, "r_x2": 278.298, "r_y2": 130.889, "r_x3": 255.517, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.298, "r_y0": 139.68600000000004, "r_x1": 281.065, "r_y1": 139.68600000000004, "r_x2": 281.065, "r_y2": 130.889, "r_x3": 278.298, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.946, "r_y0": 139.68600000000004, "r_x1": 312.818, "r_y1": 139.68600000000004, "r_x2": 312.818, "r_y2": 130.889, "r_x3": 284.946, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.818, "r_y0": 139.68600000000004, "r_x1": 315.585, "r_y1": 139.68600000000004, "r_x2": 315.585, "r_y2": 130.889, "r_x3": 312.818, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 319.466, "r_y0": 139.68600000000004, "r_x1": 343.138, "r_y1": 139.68600000000004, "r_x2": 343.138, "r_y2": 130.889, "r_x3": 319.466, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.132, "r_y0": 139.68600000000004, "r_x1": 363.179, "r_y1": 139.68600000000004, "r_x2": 363.179, "r_y2": 130.889, "r_x3": 347.132, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.06, "r_y0": 139.68600000000004, "r_x1": 395.823, "r_y1": 139.68600000000004, "r_x2": 395.823, "r_y2": 130.889, "r_x3": 367.06, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.823, "r_y0": 139.68600000000004, "r_x1": 398.59, "r_y1": 139.68600000000004, "r_x2": 398.59, "r_y2": 130.889, "r_x3": 395.823, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.475, "r_y0": 139.68600000000004, "r_x1": 480.592, "r_y1": 139.68600000000004, "r_x2": 480.592, "r_y2": 130.889, "r_x3": 402.475, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "one can construct", "orig": "one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.594, "r_y1": 151.64200000000005, "r_x2": 480.594, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 480.586, "r_y1": 163.59699999999998, "r_x2": 480.586, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.594, "r_y1": 175.55200000000002, "r_x2": 480.594, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 261.926, "r_y1": 187.50699999999995, "r_x2": 261.926, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.607, "r_y0": 229.005, "r_x1": 173.486, "r_y1": 229.005, "r_x2": 173.486, "r_y2": 221.07899999999995, "r_x3": 145.607, "r_y3": 221.07899999999995, "coord_origin": "TOPLEFT"}, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.56, "r_y0": 230.15300000000002, "r_x1": 469.752, "r_y1": 230.15300000000002, "r_x2": 469.752, "r_y2": 218.86400000000003, "r_x3": 176.56, "r_y3": 218.86400000000003, "coord_origin": "TOPLEFT"}, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 377.004, "r_x1": 480.593, "r_y1": 377.004, "r_x2": 480.593, "r_y2": 368.207, "r_x3": 149.709, "r_y3": 368.207, "coord_origin": "TOPLEFT"}, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 388.959, "r_x1": 480.587, "r_y1": 388.959, "r_x2": 480.587, "r_y2": 380.162, "r_x3": 134.765, "r_y3": 380.162, "coord_origin": "TOPLEFT"}, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 400.914, "r_x1": 480.592, "r_y1": 400.914, "r_x2": 480.592, "r_y2": 392.117, "r_x3": 134.765, "r_y3": 392.117, "coord_origin": "TOPLEFT"}, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 412.869, "r_x1": 480.59, "r_y1": 412.869, "r_x2": 480.59, "r_y2": 404.072, "r_x3": 134.765, "r_y3": 404.072, "coord_origin": "TOPLEFT"}, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 424.825, "r_x1": 480.589, "r_y1": 424.825, "r_x2": 480.589, "r_y2": 416.028, "r_x3": 134.765, "r_y3": 416.028, "coord_origin": "TOPLEFT"}, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 436.78, "r_x1": 480.593, "r_y1": 436.78, "r_x2": 480.593, "r_y2": 427.983, "r_x3": 134.765, "r_y3": 427.983, "coord_origin": "TOPLEFT"}, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 448.735, "r_x1": 187.934, "r_y1": 448.735, "r_x2": 187.934, "r_y2": 439.938, "r_x3": 134.765, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.931, "r_y0": 448.735, "r_x1": 211.603, "r_y1": 448.735, "r_x2": 211.603, "r_y2": 439.938, "r_x3": 187.931, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.754, "r_y0": 448.735, "r_x1": 230.801, "r_y1": 448.735, "r_x2": 230.801, "r_y2": 439.938, "r_x3": 214.754, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.839, "r_y0": 448.735, "r_x1": 262.602, "r_y1": 448.735, "r_x2": 262.602, "r_y2": 439.938, "r_x3": 233.839, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.716, "r_y0": 448.735, "r_x1": 480.59, "r_y1": 448.735, "r_x2": 480.59, "r_y2": 439.938, "r_x3": 262.716, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 460.69, "r_x1": 155.266, "r_y1": 460.69, "r_x2": 155.266, "r_y2": 451.893, "r_x3": 134.765, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "ture,", "orig": "ture,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.789, "r_y0": 460.69, "r_x1": 260.86, "r_y1": 460.69, "r_x2": 260.86, "r_y2": 451.893, "r_x3": 159.789, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "one needs to explicitly", "orig": "one needs to explicitly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.383, "r_y0": 460.69, "r_x1": 480.588, "r_y1": 460.69, "r_x2": 480.588, "r_y2": 451.893, "r_x3": 265.383, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "enumerate possible column-spans and row-spans", "orig": "enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 472.645, "r_x1": 480.587, "r_y1": 472.645, "r_x2": 480.587, "r_y2": 463.848, "r_x3": 134.765, "r_y3": 463.848, "coord_origin": "TOPLEFT"}, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 484.601, "r_x1": 480.587, "r_y1": 484.601, "r_x2": 480.587, "r_y2": 475.804, "r_x3": 134.765, "r_y3": 475.804, "coord_origin": "TOPLEFT"}, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 496.556, "r_x1": 480.591, "r_y1": 496.556, "r_x2": 480.591, "r_y2": 487.759, "r_x3": 134.765, "r_y3": 487.759, "coord_origin": "TOPLEFT"}, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 508.511, "r_x1": 480.593, "r_y1": 508.511, "r_x2": 480.593, "r_y2": 499.714, "r_x3": 134.765, "r_y3": 499.714, "coord_origin": "TOPLEFT"}, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 520.466, "r_x1": 480.595, "r_y1": 520.466, "r_x2": 480.595, "r_y2": 511.669, "r_x3": 134.765, "r_y3": 511.669, "coord_origin": "TOPLEFT"}, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 532.421, "r_x1": 176.929, "r_y1": 532.421, "r_x2": 176.929, "r_y2": 523.624, "r_x3": 134.765, "r_y3": 523.624, "coord_origin": "TOPLEFT"}, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 544.84, "r_x1": 480.593, "r_y1": 544.84, "r_x2": 480.593, "r_y2": 536.043, "r_x3": 149.709, "r_y3": 536.043, "coord_origin": "TOPLEFT"}, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 556.795, "r_x1": 480.591, "r_y1": 556.795, "r_x2": 480.591, "r_y2": 547.998, "r_x3": 134.765, "r_y3": 547.998, "coord_origin": "TOPLEFT"}, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 568.75, "r_x1": 480.59, "r_y1": 568.75, "r_x2": 480.59, "r_y2": 559.953, "r_x3": 134.765, "r_y3": 559.953, "coord_origin": "TOPLEFT"}, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 580.706, "r_x1": 452.189, "r_y1": 580.706, "r_x2": 452.189, "r_y2": 571.909, "r_x3": 134.765, "r_y3": 571.909, "coord_origin": "TOPLEFT"}, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 593.124, "r_x1": 480.593, "r_y1": 593.124, "r_x2": 480.593, "r_y2": 584.327, "r_x3": 149.709, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 155.846, "r_y1": 605.08, "r_x2": 155.846, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "cells,", "orig": "cells,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.09, "r_y0": 605.08, "r_x1": 199.514, "r_y1": 605.08, "r_x2": 199.514, "r_y2": 596.283, "r_x3": 160.09, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "serialised", "orig": "serialised", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.758, "r_y0": 605.08, "r_x1": 212.058, "r_y1": 605.08, "r_x2": 212.058, "r_y2": 596.283, "r_x3": 203.758, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.302, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.283, "r_x3": 216.302, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "row-major ordering, where each row and each column have", "orig": "row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.594, "r_y1": 617.035, "r_x2": 480.594, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.591, "r_y1": 628.99, "r_x2": 480.591, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.586, "r_y1": 640.9449999999999, "r_x2": 480.586, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 141.405, "r_y1": 664.855, "r_x2": 141.405, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.281, "r_y0": 664.855, "r_x1": 151.975, "r_y1": 664.855, "r_x2": 151.975, "r_y2": 656.058, "r_x3": 145.281, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.861, "r_y0": 664.855, "r_x1": 480.595, "r_y1": 664.855, "r_x2": 480.595, "r_y2": 656.058, "r_x3": 155.861, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "complex to verify the consistency of predicted structures during sequence", "orig": "complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 5, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9269194602966309, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8696112036705017, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.594, "b": 187.50699999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9857171773910522, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.586, "r_y1": 127.731, "r_x2": 480.586, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 162.485, "r_y1": 139.68600000000004, "r_x2": 162.485, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.368, "r_y0": 139.68600000000004, "r_x1": 201.749, "r_y1": 139.68600000000004, "r_x2": 201.749, "r_y2": 130.889, "r_x3": 166.368, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 201.749, "r_y0": 139.68600000000004, "r_x1": 204.516, "r_y1": 139.68600000000004, "r_x2": 204.516, "r_y2": 130.889, "r_x3": 201.749, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.397, "r_y0": 139.68600000000004, "r_x1": 248.869, "r_y1": 139.68600000000004, "r_x2": 248.869, "r_y2": 130.889, "r_x3": 208.397, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.869, "r_y0": 139.68600000000004, "r_x1": 251.636, "r_y1": 139.68600000000004, "r_x2": 251.636, "r_y2": 130.889, "r_x3": 248.869, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.517, "r_y0": 139.68600000000004, "r_x1": 278.298, "r_y1": 139.68600000000004, "r_x2": 278.298, "r_y2": 130.889, "r_x3": 255.517, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.298, "r_y0": 139.68600000000004, "r_x1": 281.065, "r_y1": 139.68600000000004, "r_x2": 281.065, "r_y2": 130.889, "r_x3": 278.298, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.946, "r_y0": 139.68600000000004, "r_x1": 312.818, "r_y1": 139.68600000000004, "r_x2": 312.818, "r_y2": 130.889, "r_x3": 284.946, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.818, "r_y0": 139.68600000000004, "r_x1": 315.585, "r_y1": 139.68600000000004, "r_x2": 315.585, "r_y2": 130.889, "r_x3": 312.818, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 319.466, "r_y0": 139.68600000000004, "r_x1": 343.138, "r_y1": 139.68600000000004, "r_x2": 343.138, "r_y2": 130.889, "r_x3": 319.466, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.132, "r_y0": 139.68600000000004, "r_x1": 363.179, "r_y1": 139.68600000000004, "r_x2": 363.179, "r_y2": 130.889, "r_x3": 347.132, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.06, "r_y0": 139.68600000000004, "r_x1": 395.823, "r_y1": 139.68600000000004, "r_x2": 395.823, "r_y2": 130.889, "r_x3": 367.06, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.823, "r_y0": 139.68600000000004, "r_x1": 398.59, "r_y1": 139.68600000000004, "r_x2": 398.59, "r_y2": 130.889, "r_x3": 395.823, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.475, "r_y0": 139.68600000000004, "r_x1": 480.592, "r_y1": 139.68600000000004, "r_x2": 480.592, "r_y2": 130.889, "r_x3": 402.475, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "one can construct", "orig": "one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.594, "r_y1": 151.64200000000005, "r_x2": 480.594, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 480.586, "r_y1": 163.59699999999998, "r_x2": 480.586, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.594, "r_y1": 175.55200000000002, "r_x2": 480.594, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 261.926, "r_y1": 187.50699999999995, "r_x2": 261.926, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "caption", "bbox": {"l": 145.607, "t": 218.86400000000003, "r": 469.752, "b": 230.15300000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.8472551703453064, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.607, "r_y0": 229.005, "r_x1": 173.486, "r_y1": 229.005, "r_x2": 173.486, "r_y2": 221.07899999999995, "r_x3": 145.607, "r_y3": 221.07899999999995, "coord_origin": "TOPLEFT"}, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.56, "r_y0": 230.15300000000002, "r_x1": 469.752, "r_y1": 230.15300000000002, "r_x2": 469.752, "r_y2": 218.86400000000003, "r_x3": 176.56, "r_y3": 218.86400000000003, "coord_origin": "TOPLEFT"}, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 368.207, "r": 480.595, "b": 532.421, "coord_origin": "TOPLEFT"}, "confidence": 0.9844799637794495, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 377.004, "r_x1": 480.593, "r_y1": 377.004, "r_x2": 480.593, "r_y2": 368.207, "r_x3": 149.709, "r_y3": 368.207, "coord_origin": "TOPLEFT"}, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 388.959, "r_x1": 480.587, "r_y1": 388.959, "r_x2": 480.587, "r_y2": 380.162, "r_x3": 134.765, "r_y3": 380.162, "coord_origin": "TOPLEFT"}, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 400.914, "r_x1": 480.592, "r_y1": 400.914, "r_x2": 480.592, "r_y2": 392.117, "r_x3": 134.765, "r_y3": 392.117, "coord_origin": "TOPLEFT"}, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 412.869, "r_x1": 480.59, "r_y1": 412.869, "r_x2": 480.59, "r_y2": 404.072, "r_x3": 134.765, "r_y3": 404.072, "coord_origin": "TOPLEFT"}, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 424.825, "r_x1": 480.589, "r_y1": 424.825, "r_x2": 480.589, "r_y2": 416.028, "r_x3": 134.765, "r_y3": 416.028, "coord_origin": "TOPLEFT"}, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 436.78, "r_x1": 480.593, "r_y1": 436.78, "r_x2": 480.593, "r_y2": 427.983, "r_x3": 134.765, "r_y3": 427.983, "coord_origin": "TOPLEFT"}, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 448.735, "r_x1": 187.934, "r_y1": 448.735, "r_x2": 187.934, "r_y2": 439.938, "r_x3": 134.765, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.931, "r_y0": 448.735, "r_x1": 211.603, "r_y1": 448.735, "r_x2": 211.603, "r_y2": 439.938, "r_x3": 187.931, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.754, "r_y0": 448.735, "r_x1": 230.801, "r_y1": 448.735, "r_x2": 230.801, "r_y2": 439.938, "r_x3": 214.754, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.839, "r_y0": 448.735, "r_x1": 262.602, "r_y1": 448.735, "r_x2": 262.602, "r_y2": 439.938, "r_x3": 233.839, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.716, "r_y0": 448.735, "r_x1": 480.59, "r_y1": 448.735, "r_x2": 480.59, "r_y2": 439.938, "r_x3": 262.716, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 460.69, "r_x1": 155.266, "r_y1": 460.69, "r_x2": 155.266, "r_y2": 451.893, "r_x3": 134.765, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "ture,", "orig": "ture,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.789, "r_y0": 460.69, "r_x1": 260.86, "r_y1": 460.69, "r_x2": 260.86, "r_y2": 451.893, "r_x3": 159.789, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "one needs to explicitly", "orig": "one needs to explicitly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.383, "r_y0": 460.69, "r_x1": 480.588, "r_y1": 460.69, "r_x2": 480.588, "r_y2": 451.893, "r_x3": 265.383, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "enumerate possible column-spans and row-spans", "orig": "enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 472.645, "r_x1": 480.587, "r_y1": 472.645, "r_x2": 480.587, "r_y2": 463.848, "r_x3": 134.765, "r_y3": 463.848, "coord_origin": "TOPLEFT"}, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 484.601, "r_x1": 480.587, "r_y1": 484.601, "r_x2": 480.587, "r_y2": 475.804, "r_x3": 134.765, "r_y3": 475.804, "coord_origin": "TOPLEFT"}, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 496.556, "r_x1": 480.591, "r_y1": 496.556, "r_x2": 480.591, "r_y2": 487.759, "r_x3": 134.765, "r_y3": 487.759, "coord_origin": "TOPLEFT"}, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 508.511, "r_x1": 480.593, "r_y1": 508.511, "r_x2": 480.593, "r_y2": 499.714, "r_x3": 134.765, "r_y3": 499.714, "coord_origin": "TOPLEFT"}, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 520.466, "r_x1": 480.595, "r_y1": 520.466, "r_x2": 480.595, "r_y2": 511.669, "r_x3": 134.765, "r_y3": 511.669, "coord_origin": "TOPLEFT"}, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 532.421, "r_x1": 176.929, "r_y1": 532.421, "r_x2": 176.929, "r_y2": 523.624, "r_x3": 134.765, "r_y3": 523.624, "coord_origin": "TOPLEFT"}, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 536.043, "r": 480.593, "b": 580.706, "coord_origin": "TOPLEFT"}, "confidence": 0.978394627571106, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 544.84, "r_x1": 480.593, "r_y1": 544.84, "r_x2": 480.593, "r_y2": 536.043, "r_x3": 149.709, "r_y3": 536.043, "coord_origin": "TOPLEFT"}, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 556.795, "r_x1": 480.591, "r_y1": 556.795, "r_x2": 480.591, "r_y2": 547.998, "r_x3": 134.765, "r_y3": 547.998, "coord_origin": "TOPLEFT"}, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 568.75, "r_x1": 480.59, "r_y1": 568.75, "r_x2": 480.59, "r_y2": 559.953, "r_x3": 134.765, "r_y3": 559.953, "coord_origin": "TOPLEFT"}, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 580.706, "r_x1": 452.189, "r_y1": 580.706, "r_x2": 452.189, "r_y2": 571.909, "r_x3": 134.765, "r_y3": 571.909, "coord_origin": "TOPLEFT"}, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 584.327, "r": 480.595, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9838283061981201, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 593.124, "r_x1": 480.593, "r_y1": 593.124, "r_x2": 480.593, "r_y2": 584.327, "r_x3": 149.709, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 155.846, "r_y1": 605.08, "r_x2": 155.846, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "cells,", "orig": "cells,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.09, "r_y0": 605.08, "r_x1": 199.514, "r_y1": 605.08, "r_x2": 199.514, "r_y2": 596.283, "r_x3": 160.09, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "serialised", "orig": "serialised", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.758, "r_y0": 605.08, "r_x1": 212.058, "r_y1": 605.08, "r_x2": 212.058, "r_y2": 596.283, "r_x3": 203.758, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.302, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.283, "r_x3": 216.302, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "row-major ordering, where each row and each column have", "orig": "row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.594, "r_y1": 617.035, "r_x2": 480.594, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.591, "r_y1": 628.99, "r_x2": 480.591, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.586, "r_y1": 640.9449999999999, "r_x2": 480.586, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 141.405, "r_y1": 664.855, "r_x2": 141.405, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.281, "r_y0": 664.855, "r_x1": 151.975, "r_y1": 664.855, "r_x2": 151.975, "r_y2": 656.058, "r_x3": 145.281, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.861, "r_y0": 664.855, "r_x1": 480.595, "r_y1": 664.855, "r_x2": 480.595, "r_y2": 656.058, "r_x3": 155.861, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "complex to verify the consistency of predicted structures during sequence", "orig": "complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "picture", "bbox": {"l": 137.41448974609375, "t": 233.51231384277344, "r": 476.5608215332031, "b": 340.2304992675781, "coord_origin": "TOPLEFT"}, "confidence": 0.9387977123260498, "cells": [], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 5, "page_no": 4, "cluster": {"id": 5, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9269194602966309, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 6, "page_no": 4, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8696112036705017, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5"}, {"label": "text", "id": 0, "page_no": 4, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.594, "b": 187.50699999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9857171773910522, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.586, "r_y1": 127.731, "r_x2": 480.586, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 162.485, "r_y1": 139.68600000000004, "r_x2": 162.485, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.368, "r_y0": 139.68600000000004, "r_x1": 201.749, "r_y1": 139.68600000000004, "r_x2": 201.749, "r_y2": 130.889, "r_x3": 166.368, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 201.749, "r_y0": 139.68600000000004, "r_x1": 204.516, "r_y1": 139.68600000000004, "r_x2": 204.516, "r_y2": 130.889, "r_x3": 201.749, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.397, "r_y0": 139.68600000000004, "r_x1": 248.869, "r_y1": 139.68600000000004, "r_x2": 248.869, "r_y2": 130.889, "r_x3": 208.397, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.869, "r_y0": 139.68600000000004, "r_x1": 251.636, "r_y1": 139.68600000000004, "r_x2": 251.636, "r_y2": 130.889, "r_x3": 248.869, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.517, "r_y0": 139.68600000000004, "r_x1": 278.298, "r_y1": 139.68600000000004, "r_x2": 278.298, "r_y2": 130.889, "r_x3": 255.517, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.298, "r_y0": 139.68600000000004, "r_x1": 281.065, "r_y1": 139.68600000000004, "r_x2": 281.065, "r_y2": 130.889, "r_x3": 278.298, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.946, "r_y0": 139.68600000000004, "r_x1": 312.818, "r_y1": 139.68600000000004, "r_x2": 312.818, "r_y2": 130.889, "r_x3": 284.946, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.818, "r_y0": 139.68600000000004, "r_x1": 315.585, "r_y1": 139.68600000000004, "r_x2": 315.585, "r_y2": 130.889, "r_x3": 312.818, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 319.466, "r_y0": 139.68600000000004, "r_x1": 343.138, "r_y1": 139.68600000000004, "r_x2": 343.138, "r_y2": 130.889, "r_x3": 319.466, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.132, "r_y0": 139.68600000000004, "r_x1": 363.179, "r_y1": 139.68600000000004, "r_x2": 363.179, "r_y2": 130.889, "r_x3": 347.132, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.06, "r_y0": 139.68600000000004, "r_x1": 395.823, "r_y1": 139.68600000000004, "r_x2": 395.823, "r_y2": 130.889, "r_x3": 367.06, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.823, "r_y0": 139.68600000000004, "r_x1": 398.59, "r_y1": 139.68600000000004, "r_x2": 398.59, "r_y2": 130.889, "r_x3": 395.823, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.475, "r_y0": 139.68600000000004, "r_x1": 480.592, "r_y1": 139.68600000000004, "r_x2": 480.592, "r_y2": 130.889, "r_x3": 402.475, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "one can construct", "orig": "one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.594, "r_y1": 151.64200000000005, "r_x2": 480.594, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 480.586, "r_y1": 163.59699999999998, "r_x2": 480.586, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.594, "r_y1": 175.55200000000002, "r_x2": 480.594, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 261.926, "r_y1": 187.50699999999995, "r_x2": 261.926, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "ulary and can be interpreted as a table structure. For example, with the HTML tokens <table> , </table> , <tr> , </tr> , <td> and </td> , one can construct simple table structures without any spanning cells. In reality though, one needs at least 28 HTML tokens to describe the most common complex tables observed in real-world documents [21,22], due to a variety of spanning cells definitions in the HTML token vocabulary."}, {"label": "caption", "id": 7, "page_no": 4, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 145.607, "t": 218.86400000000003, "r": 469.752, "b": 230.15300000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.8472551703453064, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.607, "r_y0": 229.005, "r_x1": 173.486, "r_y1": 229.005, "r_x2": 173.486, "r_y2": 221.07899999999995, "r_x3": 145.607, "r_y3": 221.07899999999995, "coord_origin": "TOPLEFT"}, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.56, "r_y0": 230.15300000000002, "r_x1": 469.752, "r_y1": 230.15300000000002, "r_x2": 469.752, "r_y2": 218.86400000000003, "r_x3": 176.56, "r_y3": 218.86400000000003, "coord_origin": "TOPLEFT"}, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 2. Frequency of tokens in HTML and OTSL as they appear in PubTabNet."}, {"label": "text", "id": 1, "page_no": 4, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 368.207, "r": 480.595, "b": 532.421, "coord_origin": "TOPLEFT"}, "confidence": 0.9844799637794495, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 377.004, "r_x1": 480.593, "r_y1": 377.004, "r_x2": 480.593, "r_y2": 368.207, "r_x3": 149.709, "r_y3": 368.207, "coord_origin": "TOPLEFT"}, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 388.959, "r_x1": 480.587, "r_y1": 388.959, "r_x2": 480.587, "r_y2": 380.162, "r_x3": 134.765, "r_y3": 380.162, "coord_origin": "TOPLEFT"}, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 400.914, "r_x1": 480.592, "r_y1": 400.914, "r_x2": 480.592, "r_y2": 392.117, "r_x3": 134.765, "r_y3": 392.117, "coord_origin": "TOPLEFT"}, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 412.869, "r_x1": 480.59, "r_y1": 412.869, "r_x2": 480.59, "r_y2": 404.072, "r_x3": 134.765, "r_y3": 404.072, "coord_origin": "TOPLEFT"}, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 424.825, "r_x1": 480.589, "r_y1": 424.825, "r_x2": 480.589, "r_y2": 416.028, "r_x3": 134.765, "r_y3": 416.028, "coord_origin": "TOPLEFT"}, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 436.78, "r_x1": 480.593, "r_y1": 436.78, "r_x2": 480.593, "r_y2": 427.983, "r_x3": 134.765, "r_y3": 427.983, "coord_origin": "TOPLEFT"}, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 448.735, "r_x1": 187.934, "r_y1": 448.735, "r_x2": 187.934, "r_y2": 439.938, "r_x3": 134.765, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.931, "r_y0": 448.735, "r_x1": 211.603, "r_y1": 448.735, "r_x2": 211.603, "r_y2": 439.938, "r_x3": 187.931, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.754, "r_y0": 448.735, "r_x1": 230.801, "r_y1": 448.735, "r_x2": 230.801, "r_y2": 439.938, "r_x3": 214.754, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.839, "r_y0": 448.735, "r_x1": 262.602, "r_y1": 448.735, "r_x2": 262.602, "r_y2": 439.938, "r_x3": 233.839, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.716, "r_y0": 448.735, "r_x1": 480.59, "r_y1": 448.735, "r_x2": 480.59, "r_y2": 439.938, "r_x3": 262.716, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 460.69, "r_x1": 155.266, "r_y1": 460.69, "r_x2": 155.266, "r_y2": 451.893, "r_x3": 134.765, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "ture,", "orig": "ture,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.789, "r_y0": 460.69, "r_x1": 260.86, "r_y1": 460.69, "r_x2": 260.86, "r_y2": 451.893, "r_x3": 159.789, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "one needs to explicitly", "orig": "one needs to explicitly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.383, "r_y0": 460.69, "r_x1": 480.588, "r_y1": 460.69, "r_x2": 480.588, "r_y2": 451.893, "r_x3": 265.383, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "enumerate possible column-spans and row-spans", "orig": "enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 472.645, "r_x1": 480.587, "r_y1": 472.645, "r_x2": 480.587, "r_y2": 463.848, "r_x3": 134.765, "r_y3": 463.848, "coord_origin": "TOPLEFT"}, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 484.601, "r_x1": 480.587, "r_y1": 484.601, "r_x2": 480.587, "r_y2": 475.804, "r_x3": 134.765, "r_y3": 475.804, "coord_origin": "TOPLEFT"}, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 496.556, "r_x1": 480.591, "r_y1": 496.556, "r_x2": 480.591, "r_y2": 487.759, "r_x3": 134.765, "r_y3": 487.759, "coord_origin": "TOPLEFT"}, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 508.511, "r_x1": 480.593, "r_y1": 508.511, "r_x2": 480.593, "r_y2": 499.714, "r_x3": 134.765, "r_y3": 499.714, "coord_origin": "TOPLEFT"}, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 520.466, "r_x1": 480.595, "r_y1": 520.466, "r_x2": 480.595, "r_y2": 511.669, "r_x3": 134.765, "r_y3": 511.669, "coord_origin": "TOPLEFT"}, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 532.421, "r_x1": 176.929, "r_y1": 532.421, "r_x2": 176.929, "r_y2": 523.624, "r_x3": 134.765, "r_y3": 523.624, "coord_origin": "TOPLEFT"}, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Obviously, HTML and other general-purpose markup languages were not designed for Im2Seq models. As such, they have some serious drawbacks. First, the token vocabulary needs to be artificially large in order to describe all plausible tabular structures. Since most Im2Seq models use an autoregressive approach, they generate the sequence token by token. Therefore, to reduce inference time, a shorter sequence length is critical. Every table-cell is represented by at least two tokens ( <td> and </td> ). Furthermore, when tokenizing the HTML structure, one needs to explicitly enumerate possible column-spans and row-spans as words. In practice, this ends up requiring 28 different HTML tokens (when including column- and row-spans up to 10 cells) just to describe every table in the PubTabNet dataset. Clearly, not every token is equally represented, as is depicted in Figure 2. This skewed distribution of tokens in combination with variable token row-length makes it challenging for models to learn the HTML structure."}, {"label": "text", "id": 3, "page_no": 4, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 536.043, "r": 480.593, "b": 580.706, "coord_origin": "TOPLEFT"}, "confidence": 0.978394627571106, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 544.84, "r_x1": 480.593, "r_y1": 544.84, "r_x2": 480.593, "r_y2": 536.043, "r_x3": 149.709, "r_y3": 536.043, "coord_origin": "TOPLEFT"}, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 556.795, "r_x1": 480.591, "r_y1": 556.795, "r_x2": 480.591, "r_y2": 547.998, "r_x3": 134.765, "r_y3": 547.998, "coord_origin": "TOPLEFT"}, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 568.75, "r_x1": 480.59, "r_y1": 568.75, "r_x2": 480.59, "r_y2": 559.953, "r_x3": 134.765, "r_y3": 559.953, "coord_origin": "TOPLEFT"}, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 580.706, "r_x1": 452.189, "r_y1": 580.706, "r_x2": 452.189, "r_y2": 571.909, "r_x3": 134.765, "r_y3": 571.909, "coord_origin": "TOPLEFT"}, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Additionally, it would be desirable if the representation would easily allow an early detection of invalid sequences on-the-go, before the prediction of the entire table structure is completed. HTML is not well-suited for this purpose as the verification of incomplete sequences is non-trivial or even impossible."}, {"label": "text", "id": 2, "page_no": 4, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 584.327, "r": 480.595, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9838283061981201, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 593.124, "r_x1": 480.593, "r_y1": 593.124, "r_x2": 480.593, "r_y2": 584.327, "r_x3": 149.709, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 155.846, "r_y1": 605.08, "r_x2": 155.846, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "cells,", "orig": "cells,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.09, "r_y0": 605.08, "r_x1": 199.514, "r_y1": 605.08, "r_x2": 199.514, "r_y2": 596.283, "r_x3": 160.09, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "serialised", "orig": "serialised", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.758, "r_y0": 605.08, "r_x1": 212.058, "r_y1": 605.08, "r_x2": 212.058, "r_y2": 596.283, "r_x3": 203.758, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.302, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.283, "r_x3": 216.302, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "row-major ordering, where each row and each column have", "orig": "row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.594, "r_y1": 617.035, "r_x2": 480.594, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.591, "r_y1": 628.99, "r_x2": 480.591, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.586, "r_y1": 640.9449999999999, "r_x2": 480.586, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 141.405, "r_y1": 664.855, "r_x2": 141.405, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.281, "r_y0": 664.855, "r_x1": 151.975, "r_y1": 664.855, "r_x2": 151.975, "r_y2": 656.058, "r_x3": 145.281, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.861, "r_y0": 664.855, "r_x1": 480.595, "r_y1": 664.855, "r_x2": 480.595, "r_y2": 656.058, "r_x3": 155.861, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "complex to verify the consistency of predicted structures during sequence", "orig": "complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table cells, serialised in row-major ordering, where each row and each column have the same length (while considering row- and column-spans). Furthermore, every opening tag in HTML needs to be matched by a closing tag in a correct hierarchical manner. Since the number of tokens for each table row and column can vary significantly, especially for large tables with many row- and column-spans, it is complex to verify the consistency of predicted structures during sequence"}, {"label": "picture", "id": 4, "page_no": 4, "cluster": {"id": 4, "label": "picture", "bbox": {"l": 137.41448974609375, "t": 233.51231384277344, "r": 476.5608215332031, "b": 340.2304992675781, "coord_origin": "TOPLEFT"}, "confidence": 0.9387977123260498, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "text", "id": 0, "page_no": 4, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.594, "b": 187.50699999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9857171773910522, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.586, "r_y1": 127.731, "r_x2": 480.586, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 162.485, "r_y1": 139.68600000000004, "r_x2": 162.485, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.368, "r_y0": 139.68600000000004, "r_x1": 201.749, "r_y1": 139.68600000000004, "r_x2": 201.749, "r_y2": 130.889, "r_x3": 166.368, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 201.749, "r_y0": 139.68600000000004, "r_x1": 204.516, "r_y1": 139.68600000000004, "r_x2": 204.516, "r_y2": 130.889, "r_x3": 201.749, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.397, "r_y0": 139.68600000000004, "r_x1": 248.869, "r_y1": 139.68600000000004, "r_x2": 248.869, "r_y2": 130.889, "r_x3": 208.397, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.869, "r_y0": 139.68600000000004, "r_x1": 251.636, "r_y1": 139.68600000000004, "r_x2": 251.636, "r_y2": 130.889, "r_x3": 248.869, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.517, "r_y0": 139.68600000000004, "r_x1": 278.298, "r_y1": 139.68600000000004, "r_x2": 278.298, "r_y2": 130.889, "r_x3": 255.517, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<tr>", "orig": "<tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.298, "r_y0": 139.68600000000004, "r_x1": 281.065, "r_y1": 139.68600000000004, "r_x2": 281.065, "r_y2": 130.889, "r_x3": 278.298, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.946, "r_y0": 139.68600000000004, "r_x1": 312.818, "r_y1": 139.68600000000004, "r_x2": 312.818, "r_y2": 130.889, "r_x3": 284.946, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</tr>", "orig": "</tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.818, "r_y0": 139.68600000000004, "r_x1": 315.585, "r_y1": 139.68600000000004, "r_x2": 315.585, "r_y2": 130.889, "r_x3": 312.818, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 319.466, "r_y0": 139.68600000000004, "r_x1": 343.138, "r_y1": 139.68600000000004, "r_x2": 343.138, "r_y2": 130.889, "r_x3": 319.466, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.132, "r_y0": 139.68600000000004, "r_x1": 363.179, "r_y1": 139.68600000000004, "r_x2": 363.179, "r_y2": 130.889, "r_x3": 347.132, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.06, "r_y0": 139.68600000000004, "r_x1": 395.823, "r_y1": 139.68600000000004, "r_x2": 395.823, "r_y2": 130.889, "r_x3": 367.06, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.823, "r_y0": 139.68600000000004, "r_x1": 398.59, "r_y1": 139.68600000000004, "r_x2": 398.59, "r_y2": 130.889, "r_x3": 395.823, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.475, "r_y0": 139.68600000000004, "r_x1": 480.592, "r_y1": 139.68600000000004, "r_x2": 480.592, "r_y2": 130.889, "r_x3": 402.475, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "one can construct", "orig": "one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 480.594, "r_y1": 151.64200000000005, "r_x2": 480.594, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 163.59699999999998, "r_x1": 480.586, "r_y1": 163.59699999999998, "r_x2": 480.586, "r_y2": 154.79999999999995, "r_x3": 134.765, "r_y3": 154.79999999999995, "coord_origin": "TOPLEFT"}, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 175.55200000000002, "r_x1": 480.594, "r_y1": 175.55200000000002, "r_x2": 480.594, "r_y2": 166.755, "r_x3": 134.765, "r_y3": 166.755, "coord_origin": "TOPLEFT"}, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 187.50699999999995, "r_x1": 261.926, "r_y1": 187.50699999999995, "r_x2": 261.926, "r_y2": 178.71000000000004, "r_x3": 134.765, "r_y3": 178.71000000000004, "coord_origin": "TOPLEFT"}, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "ulary and can be interpreted as a table structure. For example, with the HTML tokens <table> , </table> , <tr> , </tr> , <td> and </td> , one can construct simple table structures without any spanning cells. In reality though, one needs at least 28 HTML tokens to describe the most common complex tables observed in real-world documents [21,22], due to a variety of spanning cells definitions in the HTML token vocabulary."}, {"label": "caption", "id": 7, "page_no": 4, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 145.607, "t": 218.86400000000003, "r": 469.752, "b": 230.15300000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.8472551703453064, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.607, "r_y0": 229.005, "r_x1": 173.486, "r_y1": 229.005, "r_x2": 173.486, "r_y2": 221.07899999999995, "r_x3": 145.607, "r_y3": 221.07899999999995, "coord_origin": "TOPLEFT"}, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.56, "r_y0": 230.15300000000002, "r_x1": 469.752, "r_y1": 230.15300000000002, "r_x2": 469.752, "r_y2": 218.86400000000003, "r_x3": 176.56, "r_y3": 218.86400000000003, "coord_origin": "TOPLEFT"}, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 2. Frequency of tokens in HTML and OTSL as they appear in PubTabNet."}, {"label": "text", "id": 1, "page_no": 4, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 368.207, "r": 480.595, "b": 532.421, "coord_origin": "TOPLEFT"}, "confidence": 0.9844799637794495, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 377.004, "r_x1": 480.593, "r_y1": 377.004, "r_x2": 480.593, "r_y2": 368.207, "r_x3": 149.709, "r_y3": 368.207, "coord_origin": "TOPLEFT"}, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 388.959, "r_x1": 480.587, "r_y1": 388.959, "r_x2": 480.587, "r_y2": 380.162, "r_x3": 134.765, "r_y3": 380.162, "coord_origin": "TOPLEFT"}, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 400.914, "r_x1": 480.592, "r_y1": 400.914, "r_x2": 480.592, "r_y2": 392.117, "r_x3": 134.765, "r_y3": 392.117, "coord_origin": "TOPLEFT"}, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 412.869, "r_x1": 480.59, "r_y1": 412.869, "r_x2": 480.59, "r_y2": 404.072, "r_x3": 134.765, "r_y3": 404.072, "coord_origin": "TOPLEFT"}, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 424.825, "r_x1": 480.589, "r_y1": 424.825, "r_x2": 480.589, "r_y2": 416.028, "r_x3": 134.765, "r_y3": 416.028, "coord_origin": "TOPLEFT"}, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 436.78, "r_x1": 480.593, "r_y1": 436.78, "r_x2": 480.593, "r_y2": 427.983, "r_x3": 134.765, "r_y3": 427.983, "coord_origin": "TOPLEFT"}, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 448.735, "r_x1": 187.934, "r_y1": 448.735, "r_x2": 187.934, "r_y2": 439.938, "r_x3": 134.765, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.931, "r_y0": 448.735, "r_x1": 211.603, "r_y1": 448.735, "r_x2": 211.603, "r_y2": 439.938, "r_x3": 187.931, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "<td>", "orig": "<td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.754, "r_y0": 448.735, "r_x1": 230.801, "r_y1": 448.735, "r_x2": 230.801, "r_y2": 439.938, "r_x3": 214.754, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.839, "r_y0": 448.735, "r_x1": 262.602, "r_y1": 448.735, "r_x2": 262.602, "r_y2": 439.938, "r_x3": 233.839, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "</td>", "orig": "</td>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.716, "r_y0": 448.735, "r_x1": 480.59, "r_y1": 448.735, "r_x2": 480.59, "r_y2": 439.938, "r_x3": 262.716, "r_y3": 439.938, "coord_origin": "TOPLEFT"}, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 460.69, "r_x1": 155.266, "r_y1": 460.69, "r_x2": 155.266, "r_y2": 451.893, "r_x3": 134.765, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "ture,", "orig": "ture,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.789, "r_y0": 460.69, "r_x1": 260.86, "r_y1": 460.69, "r_x2": 260.86, "r_y2": 451.893, "r_x3": 159.789, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "one needs to explicitly", "orig": "one needs to explicitly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.383, "r_y0": 460.69, "r_x1": 480.588, "r_y1": 460.69, "r_x2": 480.588, "r_y2": 451.893, "r_x3": 265.383, "r_y3": 451.893, "coord_origin": "TOPLEFT"}, "text": "enumerate possible column-spans and row-spans", "orig": "enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 472.645, "r_x1": 480.587, "r_y1": 472.645, "r_x2": 480.587, "r_y2": 463.848, "r_x3": 134.765, "r_y3": 463.848, "coord_origin": "TOPLEFT"}, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 484.601, "r_x1": 480.587, "r_y1": 484.601, "r_x2": 480.587, "r_y2": 475.804, "r_x3": 134.765, "r_y3": 475.804, "coord_origin": "TOPLEFT"}, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 496.556, "r_x1": 480.591, "r_y1": 496.556, "r_x2": 480.591, "r_y2": 487.759, "r_x3": 134.765, "r_y3": 487.759, "coord_origin": "TOPLEFT"}, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 508.511, "r_x1": 480.593, "r_y1": 508.511, "r_x2": 480.593, "r_y2": 499.714, "r_x3": 134.765, "r_y3": 499.714, "coord_origin": "TOPLEFT"}, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 520.466, "r_x1": 480.595, "r_y1": 520.466, "r_x2": 480.595, "r_y2": 511.669, "r_x3": 134.765, "r_y3": 511.669, "coord_origin": "TOPLEFT"}, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 532.421, "r_x1": 176.929, "r_y1": 532.421, "r_x2": 176.929, "r_y2": 523.624, "r_x3": 134.765, "r_y3": 523.624, "coord_origin": "TOPLEFT"}, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Obviously, HTML and other general-purpose markup languages were not designed for Im2Seq models. As such, they have some serious drawbacks. First, the token vocabulary needs to be artificially large in order to describe all plausible tabular structures. Since most Im2Seq models use an autoregressive approach, they generate the sequence token by token. Therefore, to reduce inference time, a shorter sequence length is critical. Every table-cell is represented by at least two tokens ( <td> and </td> ). Furthermore, when tokenizing the HTML structure, one needs to explicitly enumerate possible column-spans and row-spans as words. In practice, this ends up requiring 28 different HTML tokens (when including column- and row-spans up to 10 cells) just to describe every table in the PubTabNet dataset. Clearly, not every token is equally represented, as is depicted in Figure 2. This skewed distribution of tokens in combination with variable token row-length makes it challenging for models to learn the HTML structure."}, {"label": "text", "id": 3, "page_no": 4, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 536.043, "r": 480.593, "b": 580.706, "coord_origin": "TOPLEFT"}, "confidence": 0.978394627571106, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 544.84, "r_x1": 480.593, "r_y1": 544.84, "r_x2": 480.593, "r_y2": 536.043, "r_x3": 149.709, "r_y3": 536.043, "coord_origin": "TOPLEFT"}, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 556.795, "r_x1": 480.591, "r_y1": 556.795, "r_x2": 480.591, "r_y2": 547.998, "r_x3": 134.765, "r_y3": 547.998, "coord_origin": "TOPLEFT"}, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 568.75, "r_x1": 480.59, "r_y1": 568.75, "r_x2": 480.59, "r_y2": 559.953, "r_x3": 134.765, "r_y3": 559.953, "coord_origin": "TOPLEFT"}, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 580.706, "r_x1": 452.189, "r_y1": 580.706, "r_x2": 452.189, "r_y2": 571.909, "r_x3": 134.765, "r_y3": 571.909, "coord_origin": "TOPLEFT"}, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Additionally, it would be desirable if the representation would easily allow an early detection of invalid sequences on-the-go, before the prediction of the entire table structure is completed. HTML is not well-suited for this purpose as the verification of incomplete sequences is non-trivial or even impossible."}, {"label": "text", "id": 2, "page_no": 4, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 584.327, "r": 480.595, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9838283061981201, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 593.124, "r_x1": 480.593, "r_y1": 593.124, "r_x2": 480.593, "r_y2": 584.327, "r_x3": 149.709, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 155.846, "r_y1": 605.08, "r_x2": 155.846, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "cells,", "orig": "cells,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.09, "r_y0": 605.08, "r_x1": 199.514, "r_y1": 605.08, "r_x2": 199.514, "r_y2": 596.283, "r_x3": 160.09, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "serialised", "orig": "serialised", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.758, "r_y0": 605.08, "r_x1": 212.058, "r_y1": 605.08, "r_x2": 212.058, "r_y2": 596.283, "r_x3": 203.758, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.302, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.283, "r_x3": 216.302, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "row-major ordering, where each row and each column have", "orig": "row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 480.594, "r_y1": 617.035, "r_x2": 480.594, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.99, "r_x1": 480.591, "r_y1": 628.99, "r_x2": 480.591, "r_y2": 620.193, "r_x3": 134.765, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.586, "r_y1": 640.9449999999999, "r_x2": 480.586, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 141.405, "r_y1": 664.855, "r_x2": 141.405, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.281, "r_y0": 664.855, "r_x1": 151.975, "r_y1": 664.855, "r_x2": 151.975, "r_y2": 656.058, "r_x3": 145.281, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.861, "r_y0": 664.855, "r_x1": 480.595, "r_y1": 664.855, "r_x2": 480.595, "r_y2": 656.058, "r_x3": 155.861, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "complex to verify the consistency of predicted structures during sequence", "orig": "complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table cells, serialised in row-major ordering, where each row and each column have the same length (while considering row- and column-spans). Furthermore, every opening tag in HTML needs to be matched by a closing tag in a correct hierarchical manner. Since the number of tokens for each table row and column can vary significantly, especially for large tables with many row- and column-spans, it is complex to verify the consistency of predicted structures during sequence"}, {"label": "picture", "id": 4, "page_no": 4, "cluster": {"id": 4, "label": "picture", "bbox": {"l": 137.41448974609375, "t": 233.51231384277344, "r": 476.5608215332031, "b": 340.2304992675781, "coord_origin": "TOPLEFT"}, "confidence": 0.9387977123260498, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_header", "id": 5, "page_no": 4, "cluster": {"id": 5, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9269194602966309, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 6, "page_no": 4, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8696112036705017, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5"}]}}, {"page_no": 5, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.595, "r_y1": 127.731, "r_x2": 480.595, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 364.625, "r_y1": 139.68600000000004, "r_x2": 364.625, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 152.27999999999997, "r_x1": 480.59, "r_y1": 152.27999999999997, "r_x2": 480.59, "r_y2": 143.48299999999995, "r_x3": 149.709, "r_y3": 143.48299999999995, "coord_origin": "TOPLEFT"}, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 164.235, "r_x1": 480.594, "r_y1": 164.235, "r_x2": 480.594, "r_y2": 155.438, "r_x3": 134.765, "r_y3": 155.438, "coord_origin": "TOPLEFT"}, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 176.19000000000005, "r_x1": 480.587, "r_y1": 176.19000000000005, "r_x2": 480.587, "r_y2": 167.39300000000003, "r_x3": 134.765, "r_y3": 167.39300000000003, "coord_origin": "TOPLEFT"}, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 188.14499999999998, "r_x1": 480.595, "r_y1": 188.14499999999998, "r_x2": 480.595, "r_y2": 179.34799999999996, "r_x3": 134.765, "r_y3": 179.34799999999996, "coord_origin": "TOPLEFT"}, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 200.10000000000002, "r_x1": 314.278, "r_y1": 200.10000000000002, "r_x2": 314.278, "r_y2": 191.303, "r_x3": 134.765, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.056, "r_y0": 200.10000000000002, "r_x1": 374.087, "r_y1": 200.10000000000002, "r_x2": 374.087, "r_y2": 191.303, "r_x3": 318.056, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.809, "r_y0": 200.10000000000002, "r_x1": 480.586, "r_y1": 200.10000000000002, "r_x2": 480.586, "r_y2": 191.303, "r_x3": 378.809, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 212.05600000000004, "r_x1": 480.588, "r_y1": 212.05600000000004, "r_x2": 480.588, "r_y2": 203.25900000000001, "r_x3": 134.765, "r_y3": 203.25900000000001, "coord_origin": "TOPLEFT"}, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 224.01099999999997, "r_x1": 480.596, "r_y1": 224.01099999999997, "r_x2": 480.596, "r_y2": 215.21400000000006, "r_x3": 134.765, "r_y3": 215.21400000000006, "coord_origin": "TOPLEFT"}, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.966, "r_x1": 480.595, "r_y1": 235.966, "r_x2": 480.595, "r_y2": 227.16899999999998, "r_x3": 134.765, "r_y3": 227.16899999999998, "coord_origin": "TOPLEFT"}, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.92100000000005, "r_x1": 480.588, "r_y1": 247.92100000000005, "r_x2": 480.588, "r_y2": 239.12400000000002, "r_x3": 134.765, "r_y3": 239.12400000000002, "coord_origin": "TOPLEFT"}, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.876, "r_x1": 480.593, "r_y1": 259.876, "r_x2": 480.593, "r_y2": 251.07899999999995, "r_x3": 134.765, "r_y3": 251.07899999999995, "coord_origin": "TOPLEFT"}, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 271.831, "r_x1": 480.595, "r_y1": 271.831, "r_x2": 480.595, "r_y2": 263.034, "r_x3": 134.765, "r_y3": 263.034, "coord_origin": "TOPLEFT"}, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.787, "r_x1": 480.59, "r_y1": 283.787, "r_x2": 480.59, "r_y2": 274.99, "r_x3": 134.765, "r_y3": 274.99, "coord_origin": "TOPLEFT"}, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.742, "r_x1": 223.573, "r_y1": 295.742, "r_x2": 223.573, "r_y2": 286.945, "r_x3": 134.765, "r_y3": 286.945, "coord_origin": "TOPLEFT"}, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.199, "r_x1": 141.489, "r_y1": 331.199, "r_x2": 141.489, "r_y2": 320.631, "r_x3": 134.765, "r_y3": 320.631, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 331.199, "r_x1": 372.508, "r_y1": 331.199, "r_x2": 372.508, "r_y2": 320.631, "r_x3": 154.938, "r_y3": 320.631, "coord_origin": "TOPLEFT"}, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 357.914, "r_x1": 480.591, "r_y1": 357.914, "r_x2": 480.591, "r_y2": 349.117, "r_x3": 134.765, "r_y3": 349.117, "coord_origin": "TOPLEFT"}, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 369.869, "r_x1": 480.589, "r_y1": 369.869, "r_x2": 480.589, "r_y2": 361.072, "r_x3": 134.765, "r_y3": 361.072, "coord_origin": "TOPLEFT"}, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 381.825, "r_x1": 480.587, "r_y1": 381.825, "r_x2": 480.587, "r_y2": 373.028, "r_x3": 134.765, "r_y3": 373.028, "coord_origin": "TOPLEFT"}, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 393.78, "r_x1": 146.993, "r_y1": 393.78, "r_x2": 146.993, "r_y2": 384.983, "r_x3": 134.765, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "set", "orig": "set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.088, "r_y0": 393.78, "r_x1": 159.112, "r_y1": 393.78, "r_x2": 159.112, "r_y2": 384.983, "r_x3": 151.088, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.196, "r_y0": 393.78, "r_x1": 186.519, "r_y1": 393.78, "r_x2": 186.519, "r_y2": 384.983, "r_x3": 163.196, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "rules,", "orig": "rules,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.613, "r_y0": 393.78, "r_x1": 480.589, "r_y1": 393.78, "r_x2": 480.589, "r_y2": 384.983, "r_x3": 190.613, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "which are both significantly reduced compared to HTML. At the", "orig": "which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 405.735, "r_x1": 480.59, "r_y1": 405.735, "r_x2": 480.59, "r_y2": 396.938, "r_x3": 134.765, "r_y3": 396.938, "coord_origin": "TOPLEFT"}, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 417.69, "r_x1": 480.595, "r_y1": 417.69, "r_x2": 480.595, "r_y2": 408.893, "r_x3": 134.765, "r_y3": 408.893, "coord_origin": "TOPLEFT"}, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 429.645, "r_x1": 480.589, "r_y1": 429.645, "r_x2": 480.589, "r_y2": 420.848, "r_x3": 134.765, "r_y3": 420.848, "coord_origin": "TOPLEFT"}, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 441.6, "r_x1": 276.673, "r_y1": 441.6, "r_x2": 276.673, "r_y2": 432.803, "r_x3": 134.765, "r_y3": 432.803, "coord_origin": "TOPLEFT"}, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 474.679, "r_x1": 149.402, "r_y1": 474.679, "r_x2": 149.402, "r_y2": 465.872, "r_x3": 134.765, "r_y3": 465.872, "coord_origin": "TOPLEFT"}, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 474.679, "r_x1": 261.801, "r_y1": 474.679, "r_x2": 261.801, "r_y2": 465.872, "r_x3": 160.859, "r_y3": 465.872, "coord_origin": "TOPLEFT"}, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 497.795, "r_x1": 480.589, "r_y1": 497.795, "r_x2": 480.589, "r_y2": 488.998, "r_x3": 134.765, "r_y3": 488.998, "coord_origin": "TOPLEFT"}, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 509.75, "r_x1": 480.587, "r_y1": 509.75, "r_x2": 480.587, "r_y2": 500.953, "r_x3": 134.765, "r_y3": 500.953, "coord_origin": "TOPLEFT"}, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 521.706, "r_x1": 154.713, "r_y1": 521.706, "r_x2": 154.713, "r_y2": 512.909, "r_x3": 134.765, "r_y3": 512.909, "coord_origin": "TOPLEFT"}, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 534.299, "r_x1": 409.311, "r_y1": 534.299, "r_x2": 409.311, "r_y2": 525.502, "r_x3": 149.709, "r_y3": 525.502, "coord_origin": "TOPLEFT"}, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 556.777, "r_x1": 146.72, "r_y1": 556.777, "r_x2": 146.72, "r_y2": 547.97, "r_x3": 140.993, "r_y3": 547.97, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 556.777, "r_x1": 193.206, "r_y1": 556.777, "r_x2": 193.206, "r_y2": 547.98, "r_x3": 151.701, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.522, "r_y0": 556.777, "r_x1": 263.466, "r_y1": 556.777, "r_x2": 263.466, "r_y2": 547.98, "r_x3": 196.522, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 267.815, "r_y0": 556.777, "r_x1": 460.544, "r_y1": 556.777, "r_x2": 460.544, "r_y2": 547.98, "r_x3": 267.815, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 569.37, "r_x1": 146.72, "r_y1": 569.37, "r_x2": 146.72, "r_y2": 560.563, "r_x3": 140.993, "r_y3": 560.563, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 569.37, "r_x1": 194.3, "r_y1": 569.37, "r_x2": 194.3, "r_y2": 560.573, "r_x3": 151.701, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.659, "r_y0": 569.37, "r_x1": 245.75, "r_y1": 569.37, "r_x2": 245.75, "r_y2": 560.573, "r_x3": 198.659, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "left-looking", "orig": "left-looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.263, "r_y0": 569.37, "r_x1": 264.518, "r_y1": 569.37, "r_x2": 264.518, "r_y2": 560.573, "r_x3": 250.263, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.518, "r_y0": 569.37, "r_x1": 267.285, "r_y1": 569.37, "r_x2": 267.285, "r_y2": 560.573, "r_x3": 264.518, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.638, "r_y0": 569.37, "r_x1": 480.594, "r_y1": 569.37, "r_x2": 480.594, "r_y2": 560.573, "r_x3": 271.638, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "merging with the left neighbor cell to create a", "orig": "merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 581.325, "r_x1": 171.676, "r_y1": 581.325, "r_x2": 171.676, "r_y2": 572.528, "r_x3": 151.701, "r_y3": 572.528, "coord_origin": "TOPLEFT"}, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 593.919, "r_x1": 146.72, "r_y1": 593.919, "r_x2": 146.72, "r_y2": 585.112, "r_x3": 140.993, "r_y3": 585.112, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 593.919, "r_x1": 194.111, "r_y1": 593.919, "r_x2": 194.111, "r_y2": 585.1220000000001, "r_x3": 151.701, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 197.748, "r_y0": 593.919, "r_x1": 259.895, "r_y1": 593.919, "r_x2": 259.895, "r_y2": 585.1220000000001, "r_x3": 197.748, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.892, "r_y0": 593.919, "r_x1": 262.659, "r_y1": 593.919, "r_x2": 262.659, "r_y2": 585.1220000000001, "r_x3": 259.892, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.295, "r_y0": 593.919, "r_x1": 480.588, "r_y1": 593.919, "r_x2": 480.588, "r_y2": 585.1220000000001, "r_x3": 266.295, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "merging with the upper neighbor cell to create a", "orig": "merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 605.874, "r_x1": 171.676, "r_y1": 605.874, "r_x2": 171.676, "r_y2": 597.077, "r_x3": 151.701, "r_y3": 597.077, "coord_origin": "TOPLEFT"}, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 618.467, "r_x1": 146.72, "r_y1": 618.467, "r_x2": 146.72, "r_y2": 609.66, "r_x3": 140.993, "r_y3": 609.66, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 618.467, "r_x1": 193.483, "r_y1": 618.467, "r_x2": 193.483, "r_y2": 609.67, "r_x3": 151.701, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.799, "r_y0": 618.467, "r_x1": 236.12, "r_y1": 618.467, "r_x2": 236.12, "r_y2": 609.67, "r_x3": 196.799, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.125, "r_y0": 618.467, "r_x1": 238.892, "r_y1": 618.467, "r_x2": 238.892, "r_y2": 609.67, "r_x3": 236.125, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.209, "r_y0": 618.467, "r_x1": 454.555, "r_y1": 618.467, "r_x2": 454.555, "r_y2": 609.67, "r_x3": 242.209, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "to merge with both left and upper neighbor cells", "orig": "to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 631.061, "r_x1": 146.72, "r_y1": 631.061, "r_x2": 146.72, "r_y2": 622.254, "r_x3": 140.993, "r_y3": 622.254, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 631.061, "r_x1": 181.994, "r_y1": 631.061, "r_x2": 181.994, "r_y2": 622.264, "r_x3": 151.701, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.317, "r_y0": 631.061, "r_x1": 221.462, "r_y1": 631.061, "r_x2": 221.462, "r_y2": 622.264, "r_x3": 185.317, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.461, "r_y0": 631.061, "r_x1": 224.228, "r_y1": 631.061, "r_x2": 224.228, "r_y2": 622.264, "r_x3": 221.461, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.545, "r_y0": 631.061, "r_x1": 328.617, "r_y1": 631.061, "r_x2": 328.617, "r_y2": 622.264, "r_x3": 227.545, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "switch to the next row.", "orig": "switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 652.9, "r_x1": 480.593, "r_y1": 652.9, "r_x2": 480.593, "r_y2": 644.1030000000001, "r_x3": 149.709, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 228.223, "r_y1": 664.855, "r_x2": 228.223, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 14, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8378868699073792, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8919177651405334, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.595, "b": 139.68600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9633480906486511, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.595, "r_y1": 127.731, "r_x2": 480.595, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 364.625, "r_y1": 139.68600000000004, "r_x2": 364.625, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 143.48299999999995, "r": 480.596, "b": 295.742, "coord_origin": "TOPLEFT"}, "confidence": 0.9856827855110168, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 152.27999999999997, "r_x1": 480.59, "r_y1": 152.27999999999997, "r_x2": 480.59, "r_y2": 143.48299999999995, "r_x3": 149.709, "r_y3": 143.48299999999995, "coord_origin": "TOPLEFT"}, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 164.235, "r_x1": 480.594, "r_y1": 164.235, "r_x2": 480.594, "r_y2": 155.438, "r_x3": 134.765, "r_y3": 155.438, "coord_origin": "TOPLEFT"}, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 176.19000000000005, "r_x1": 480.587, "r_y1": 176.19000000000005, "r_x2": 480.587, "r_y2": 167.39300000000003, "r_x3": 134.765, "r_y3": 167.39300000000003, "coord_origin": "TOPLEFT"}, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 188.14499999999998, "r_x1": 480.595, "r_y1": 188.14499999999998, "r_x2": 480.595, "r_y2": 179.34799999999996, "r_x3": 134.765, "r_y3": 179.34799999999996, "coord_origin": "TOPLEFT"}, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 200.10000000000002, "r_x1": 314.278, "r_y1": 200.10000000000002, "r_x2": 314.278, "r_y2": 191.303, "r_x3": 134.765, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.056, "r_y0": 200.10000000000002, "r_x1": 374.087, "r_y1": 200.10000000000002, "r_x2": 374.087, "r_y2": 191.303, "r_x3": 318.056, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.809, "r_y0": 200.10000000000002, "r_x1": 480.586, "r_y1": 200.10000000000002, "r_x2": 480.586, "r_y2": 191.303, "r_x3": 378.809, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 212.05600000000004, "r_x1": 480.588, "r_y1": 212.05600000000004, "r_x2": 480.588, "r_y2": 203.25900000000001, "r_x3": 134.765, "r_y3": 203.25900000000001, "coord_origin": "TOPLEFT"}, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 224.01099999999997, "r_x1": 480.596, "r_y1": 224.01099999999997, "r_x2": 480.596, "r_y2": 215.21400000000006, "r_x3": 134.765, "r_y3": 215.21400000000006, "coord_origin": "TOPLEFT"}, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.966, "r_x1": 480.595, "r_y1": 235.966, "r_x2": 480.595, "r_y2": 227.16899999999998, "r_x3": 134.765, "r_y3": 227.16899999999998, "coord_origin": "TOPLEFT"}, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.92100000000005, "r_x1": 480.588, "r_y1": 247.92100000000005, "r_x2": 480.588, "r_y2": 239.12400000000002, "r_x3": 134.765, "r_y3": 239.12400000000002, "coord_origin": "TOPLEFT"}, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.876, "r_x1": 480.593, "r_y1": 259.876, "r_x2": 480.593, "r_y2": 251.07899999999995, "r_x3": 134.765, "r_y3": 251.07899999999995, "coord_origin": "TOPLEFT"}, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 271.831, "r_x1": 480.595, "r_y1": 271.831, "r_x2": 480.595, "r_y2": 263.034, "r_x3": 134.765, "r_y3": 263.034, "coord_origin": "TOPLEFT"}, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.787, "r_x1": 480.59, "r_y1": 283.787, "r_x2": 480.59, "r_y2": 274.99, "r_x3": 134.765, "r_y3": 274.99, "coord_origin": "TOPLEFT"}, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.742, "r_x1": 223.573, "r_y1": 295.742, "r_x2": 223.573, "r_y2": 286.945, "r_x3": 134.765, "r_y3": 286.945, "coord_origin": "TOPLEFT"}, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "section_header", "bbox": {"l": 134.765, "t": 320.631, "r": 372.508, "b": 331.199, "coord_origin": "TOPLEFT"}, "confidence": 0.957028865814209, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.199, "r_x1": 141.489, "r_y1": 331.199, "r_x2": 141.489, "r_y2": 320.631, "r_x3": 134.765, "r_y3": 320.631, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 331.199, "r_x1": 372.508, "r_y1": 331.199, "r_x2": 372.508, "r_y2": 320.631, "r_x3": 154.938, "r_y3": 320.631, "coord_origin": "TOPLEFT"}, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 349.117, "r": 480.595, "b": 441.6, "coord_origin": "TOPLEFT"}, "confidence": 0.9879323840141296, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 357.914, "r_x1": 480.591, "r_y1": 357.914, "r_x2": 480.591, "r_y2": 349.117, "r_x3": 134.765, "r_y3": 349.117, "coord_origin": "TOPLEFT"}, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 369.869, "r_x1": 480.589, "r_y1": 369.869, "r_x2": 480.589, "r_y2": 361.072, "r_x3": 134.765, "r_y3": 361.072, "coord_origin": "TOPLEFT"}, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 381.825, "r_x1": 480.587, "r_y1": 381.825, "r_x2": 480.587, "r_y2": 373.028, "r_x3": 134.765, "r_y3": 373.028, "coord_origin": "TOPLEFT"}, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 393.78, "r_x1": 146.993, "r_y1": 393.78, "r_x2": 146.993, "r_y2": 384.983, "r_x3": 134.765, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "set", "orig": "set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.088, "r_y0": 393.78, "r_x1": 159.112, "r_y1": 393.78, "r_x2": 159.112, "r_y2": 384.983, "r_x3": 151.088, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.196, "r_y0": 393.78, "r_x1": 186.519, "r_y1": 393.78, "r_x2": 186.519, "r_y2": 384.983, "r_x3": 163.196, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "rules,", "orig": "rules,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.613, "r_y0": 393.78, "r_x1": 480.589, "r_y1": 393.78, "r_x2": 480.589, "r_y2": 384.983, "r_x3": 190.613, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "which are both significantly reduced compared to HTML. At the", "orig": "which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 405.735, "r_x1": 480.59, "r_y1": 405.735, "r_x2": 480.59, "r_y2": 396.938, "r_x3": 134.765, "r_y3": 396.938, "coord_origin": "TOPLEFT"}, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 417.69, "r_x1": 480.595, "r_y1": 417.69, "r_x2": 480.595, "r_y2": 408.893, "r_x3": 134.765, "r_y3": 408.893, "coord_origin": "TOPLEFT"}, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 429.645, "r_x1": 480.589, "r_y1": 429.645, "r_x2": 480.589, "r_y2": 420.848, "r_x3": 134.765, "r_y3": 420.848, "coord_origin": "TOPLEFT"}, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 441.6, "r_x1": 276.673, "r_y1": 441.6, "r_x2": 276.673, "r_y2": 432.803, "r_x3": 134.765, "r_y3": 432.803, "coord_origin": "TOPLEFT"}, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "section_header", "bbox": {"l": 134.765, "t": 465.872, "r": 261.801, "b": 474.679, "coord_origin": "TOPLEFT"}, "confidence": 0.9559652209281921, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 474.679, "r_x1": 149.402, "r_y1": 474.679, "r_x2": 149.402, "r_y2": 465.872, "r_x3": 134.765, "r_y3": 465.872, "coord_origin": "TOPLEFT"}, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 474.679, "r_x1": 261.801, "r_y1": 474.679, "r_x2": 261.801, "r_y2": 465.872, "r_x3": 160.859, "r_y3": 465.872, "coord_origin": "TOPLEFT"}, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 488.998, "r": 480.589, "b": 521.706, "coord_origin": "TOPLEFT"}, "confidence": 0.9671263098716736, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 497.795, "r_x1": 480.589, "r_y1": 497.795, "r_x2": 480.589, "r_y2": 488.998, "r_x3": 134.765, "r_y3": 488.998, "coord_origin": "TOPLEFT"}, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 509.75, "r_x1": 480.587, "r_y1": 509.75, "r_x2": 480.587, "r_y2": 500.953, "r_x3": 134.765, "r_y3": 500.953, "coord_origin": "TOPLEFT"}, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 521.706, "r_x1": 154.713, "r_y1": 521.706, "r_x2": 154.713, "r_y2": 512.909, "r_x3": 134.765, "r_y3": 512.909, "coord_origin": "TOPLEFT"}, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 149.709, "t": 525.502, "r": 409.311, "b": 534.299, "coord_origin": "TOPLEFT"}, "confidence": 0.8555866479873657, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 534.299, "r_x1": 409.311, "r_y1": 534.299, "r_x2": 409.311, "r_y2": 525.502, "r_x3": 149.709, "r_y3": 525.502, "coord_origin": "TOPLEFT"}, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 140.993, "t": 547.97, "r": 460.544, "b": 556.777, "coord_origin": "TOPLEFT"}, "confidence": 0.9184334874153137, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 556.777, "r_x1": 146.72, "r_y1": 556.777, "r_x2": 146.72, "r_y2": 547.97, "r_x3": 140.993, "r_y3": 547.97, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 556.777, "r_x1": 193.206, "r_y1": 556.777, "r_x2": 193.206, "r_y2": 547.98, "r_x3": 151.701, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.522, "r_y0": 556.777, "r_x1": 263.466, "r_y1": 556.777, "r_x2": 263.466, "r_y2": 547.98, "r_x3": 196.522, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 267.815, "r_y0": 556.777, "r_x1": 460.544, "r_y1": 556.777, "r_x2": 460.544, "r_y2": 547.98, "r_x3": 267.815, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 140.993, "t": 560.563, "r": 480.594, "b": 581.325, "coord_origin": "TOPLEFT"}, "confidence": 0.9319931268692017, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 569.37, "r_x1": 146.72, "r_y1": 569.37, "r_x2": 146.72, "r_y2": 560.563, "r_x3": 140.993, "r_y3": 560.563, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 569.37, "r_x1": 194.3, "r_y1": 569.37, "r_x2": 194.3, "r_y2": 560.573, "r_x3": 151.701, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.659, "r_y0": 569.37, "r_x1": 245.75, "r_y1": 569.37, "r_x2": 245.75, "r_y2": 560.573, "r_x3": 198.659, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "left-looking", "orig": "left-looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.263, "r_y0": 569.37, "r_x1": 264.518, "r_y1": 569.37, "r_x2": 264.518, "r_y2": 560.573, "r_x3": 250.263, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.518, "r_y0": 569.37, "r_x1": 267.285, "r_y1": 569.37, "r_x2": 267.285, "r_y2": 560.573, "r_x3": 264.518, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.638, "r_y0": 569.37, "r_x1": 480.594, "r_y1": 569.37, "r_x2": 480.594, "r_y2": 560.573, "r_x3": 271.638, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "merging with the left neighbor cell to create a", "orig": "merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 581.325, "r_x1": 171.676, "r_y1": 581.325, "r_x2": 171.676, "r_y2": 572.528, "r_x3": 151.701, "r_y3": 572.528, "coord_origin": "TOPLEFT"}, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "list_item", "bbox": {"l": 140.993, "t": 585.112, "r": 480.588, "b": 605.874, "coord_origin": "TOPLEFT"}, "confidence": 0.9438967704772949, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 593.919, "r_x1": 146.72, "r_y1": 593.919, "r_x2": 146.72, "r_y2": 585.112, "r_x3": 140.993, "r_y3": 585.112, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 593.919, "r_x1": 194.111, "r_y1": 593.919, "r_x2": 194.111, "r_y2": 585.1220000000001, "r_x3": 151.701, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 197.748, "r_y0": 593.919, "r_x1": 259.895, "r_y1": 593.919, "r_x2": 259.895, "r_y2": 585.1220000000001, "r_x3": 197.748, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.892, "r_y0": 593.919, "r_x1": 262.659, "r_y1": 593.919, "r_x2": 262.659, "r_y2": 585.1220000000001, "r_x3": 259.892, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.295, "r_y0": 593.919, "r_x1": 480.588, "r_y1": 593.919, "r_x2": 480.588, "r_y2": 585.1220000000001, "r_x3": 266.295, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "merging with the upper neighbor cell to create a", "orig": "merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 605.874, "r_x1": 171.676, "r_y1": 605.874, "r_x2": 171.676, "r_y2": 597.077, "r_x3": 151.701, "r_y3": 597.077, "coord_origin": "TOPLEFT"}, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 140.993, "t": 609.66, "r": 454.555, "b": 618.467, "coord_origin": "TOPLEFT"}, "confidence": 0.9036387801170349, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 618.467, "r_x1": 146.72, "r_y1": 618.467, "r_x2": 146.72, "r_y2": 609.66, "r_x3": 140.993, "r_y3": 609.66, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 618.467, "r_x1": 193.483, "r_y1": 618.467, "r_x2": 193.483, "r_y2": 609.67, "r_x3": 151.701, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.799, "r_y0": 618.467, "r_x1": 236.12, "r_y1": 618.467, "r_x2": 236.12, "r_y2": 609.67, "r_x3": 196.799, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.125, "r_y0": 618.467, "r_x1": 238.892, "r_y1": 618.467, "r_x2": 238.892, "r_y2": 609.67, "r_x3": 236.125, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.209, "r_y0": 618.467, "r_x1": 454.555, "r_y1": 618.467, "r_x2": 454.555, "r_y2": 609.67, "r_x3": 242.209, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "to merge with both left and upper neighbor cells", "orig": "to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "list_item", "bbox": {"l": 140.993, "t": 622.254, "r": 328.617, "b": 631.061, "coord_origin": "TOPLEFT"}, "confidence": 0.8636871576309204, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 631.061, "r_x1": 146.72, "r_y1": 631.061, "r_x2": 146.72, "r_y2": 622.254, "r_x3": 140.993, "r_y3": 622.254, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 631.061, "r_x1": 181.994, "r_y1": 631.061, "r_x2": 181.994, "r_y2": 622.264, "r_x3": 151.701, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.317, "r_y0": 631.061, "r_x1": 221.462, "r_y1": 631.061, "r_x2": 221.462, "r_y2": 622.264, "r_x3": 185.317, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.461, "r_y0": 631.061, "r_x1": 224.228, "r_y1": 631.061, "r_x2": 224.228, "r_y2": 622.264, "r_x3": 221.461, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.545, "r_y0": 631.061, "r_x1": 328.617, "r_y1": 631.061, "r_x2": 328.617, "r_y2": 622.264, "r_x3": 227.545, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "switch to the next row.", "orig": "switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "text", "bbox": {"l": 134.765, "t": 644.1030000000001, "r": 480.593, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9443338513374329, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 652.9, "r_x1": 480.593, "r_y1": 652.9, "r_x2": 480.593, "r_y2": 644.1030000000001, "r_x3": 149.709, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 228.223, "r_y1": 664.855, "r_x2": 228.223, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 14, "page_no": 5, "cluster": {"id": 14, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8378868699073792, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6"}, {"label": "page_header", "id": 11, "page_no": 5, "cluster": {"id": 11, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8919177651405334, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}, {"label": "text", "id": 3, "page_no": 5, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.595, "b": 139.68600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9633480906486511, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.595, "r_y1": 127.731, "r_x2": 480.595, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 364.625, "r_y1": 139.68600000000004, "r_x2": 364.625, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these complex syntax rules, simply to deliver valid output."}, {"label": "text", "id": 1, "page_no": 5, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 143.48299999999995, "r": 480.596, "b": 295.742, "coord_origin": "TOPLEFT"}, "confidence": 0.9856827855110168, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 152.27999999999997, "r_x1": 480.59, "r_y1": 152.27999999999997, "r_x2": 480.59, "r_y2": 143.48299999999995, "r_x3": 149.709, "r_y3": 143.48299999999995, "coord_origin": "TOPLEFT"}, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 164.235, "r_x1": 480.594, "r_y1": 164.235, "r_x2": 480.594, "r_y2": 155.438, "r_x3": 134.765, "r_y3": 155.438, "coord_origin": "TOPLEFT"}, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 176.19000000000005, "r_x1": 480.587, "r_y1": 176.19000000000005, "r_x2": 480.587, "r_y2": 167.39300000000003, "r_x3": 134.765, "r_y3": 167.39300000000003, "coord_origin": "TOPLEFT"}, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 188.14499999999998, "r_x1": 480.595, "r_y1": 188.14499999999998, "r_x2": 480.595, "r_y2": 179.34799999999996, "r_x3": 134.765, "r_y3": 179.34799999999996, "coord_origin": "TOPLEFT"}, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 200.10000000000002, "r_x1": 314.278, "r_y1": 200.10000000000002, "r_x2": 314.278, "r_y2": 191.303, "r_x3": 134.765, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.056, "r_y0": 200.10000000000002, "r_x1": 374.087, "r_y1": 200.10000000000002, "r_x2": 374.087, "r_y2": 191.303, "r_x3": 318.056, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.809, "r_y0": 200.10000000000002, "r_x1": 480.586, "r_y1": 200.10000000000002, "r_x2": 480.586, "r_y2": 191.303, "r_x3": 378.809, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 212.05600000000004, "r_x1": 480.588, "r_y1": 212.05600000000004, "r_x2": 480.588, "r_y2": 203.25900000000001, "r_x3": 134.765, "r_y3": 203.25900000000001, "coord_origin": "TOPLEFT"}, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 224.01099999999997, "r_x1": 480.596, "r_y1": 224.01099999999997, "r_x2": 480.596, "r_y2": 215.21400000000006, "r_x3": 134.765, "r_y3": 215.21400000000006, "coord_origin": "TOPLEFT"}, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.966, "r_x1": 480.595, "r_y1": 235.966, "r_x2": 480.595, "r_y2": 227.16899999999998, "r_x3": 134.765, "r_y3": 227.16899999999998, "coord_origin": "TOPLEFT"}, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.92100000000005, "r_x1": 480.588, "r_y1": 247.92100000000005, "r_x2": 480.588, "r_y2": 239.12400000000002, "r_x3": 134.765, "r_y3": 239.12400000000002, "coord_origin": "TOPLEFT"}, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.876, "r_x1": 480.593, "r_y1": 259.876, "r_x2": 480.593, "r_y2": 251.07899999999995, "r_x3": 134.765, "r_y3": 251.07899999999995, "coord_origin": "TOPLEFT"}, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 271.831, "r_x1": 480.595, "r_y1": 271.831, "r_x2": 480.595, "r_y2": 263.034, "r_x3": 134.765, "r_y3": 263.034, "coord_origin": "TOPLEFT"}, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.787, "r_x1": 480.59, "r_y1": 283.787, "r_x2": 480.59, "r_y2": 274.99, "r_x3": 134.765, "r_y3": 274.99, "coord_origin": "TOPLEFT"}, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.742, "r_x1": 223.573, "r_y1": 295.742, "r_x2": 223.573, "r_y2": 286.945, "r_x3": 134.765, "r_y3": 286.945, "coord_origin": "TOPLEFT"}, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In practice, we observe two major issues with prediction quality when training Im2Seq models on HTML table structure generation from images. On the one hand, we find that on large tables, the visual attention of the model often starts to drift and is not accurately moving forward cell by cell anymore. This manifests itself in either in an increasing location drift for proposed table-cells in later rows on the same column or even complete loss of vertical alignment, as illustrated in Figure 5. Addressing this with post-processing is partially possible, but clearly undesired. On the other hand, we find many instances of predictions with structural inconsistencies or plain invalid HTML output, as shown in Figure 6, which are nearly impossible to properly correct. Both problems seriously impact the TSR model performance, since they reflect not only in the task of pure structure recognition but also in the equally crucial recognition or matching of table cell content."}, {"label": "section_header", "id": 4, "page_no": 5, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 134.765, "t": 320.631, "r": 372.508, "b": 331.199, "coord_origin": "TOPLEFT"}, "confidence": 0.957028865814209, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.199, "r_x1": 141.489, "r_y1": 331.199, "r_x2": 141.489, "r_y2": 320.631, "r_x3": 134.765, "r_y3": 320.631, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 331.199, "r_x1": 372.508, "r_y1": 331.199, "r_x2": 372.508, "r_y2": 320.631, "r_x3": 154.938, "r_y3": 320.631, "coord_origin": "TOPLEFT"}, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4 Optimised Table Structure Language"}, {"label": "text", "id": 0, "page_no": 5, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 349.117, "r": 480.595, "b": 441.6, "coord_origin": "TOPLEFT"}, "confidence": 0.9879323840141296, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 357.914, "r_x1": 480.591, "r_y1": 357.914, "r_x2": 480.591, "r_y2": 349.117, "r_x3": 134.765, "r_y3": 349.117, "coord_origin": "TOPLEFT"}, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 369.869, "r_x1": 480.589, "r_y1": 369.869, "r_x2": 480.589, "r_y2": 361.072, "r_x3": 134.765, "r_y3": 361.072, "coord_origin": "TOPLEFT"}, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 381.825, "r_x1": 480.587, "r_y1": 381.825, "r_x2": 480.587, "r_y2": 373.028, "r_x3": 134.765, "r_y3": 373.028, "coord_origin": "TOPLEFT"}, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 393.78, "r_x1": 146.993, "r_y1": 393.78, "r_x2": 146.993, "r_y2": 384.983, "r_x3": 134.765, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "set", "orig": "set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.088, "r_y0": 393.78, "r_x1": 159.112, "r_y1": 393.78, "r_x2": 159.112, "r_y2": 384.983, "r_x3": 151.088, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.196, "r_y0": 393.78, "r_x1": 186.519, "r_y1": 393.78, "r_x2": 186.519, "r_y2": 384.983, "r_x3": 163.196, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "rules,", "orig": "rules,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.613, "r_y0": 393.78, "r_x1": 480.589, "r_y1": 393.78, "r_x2": 480.589, "r_y2": 384.983, "r_x3": 190.613, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "which are both significantly reduced compared to HTML. At the", "orig": "which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 405.735, "r_x1": 480.59, "r_y1": 405.735, "r_x2": 480.59, "r_y2": 396.938, "r_x3": 134.765, "r_y3": 396.938, "coord_origin": "TOPLEFT"}, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 417.69, "r_x1": 480.595, "r_y1": 417.69, "r_x2": 480.595, "r_y2": 408.893, "r_x3": 134.765, "r_y3": 408.893, "coord_origin": "TOPLEFT"}, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 429.645, "r_x1": 480.589, "r_y1": 429.645, "r_x2": 480.589, "r_y2": 420.848, "r_x3": 134.765, "r_y3": 420.848, "coord_origin": "TOPLEFT"}, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 441.6, "r_x1": 276.673, "r_y1": 441.6, "r_x2": 276.673, "r_y2": 432.803, "r_x3": 134.765, "r_y3": 432.803, "coord_origin": "TOPLEFT"}, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before, we propose here our Optimised Table Structure Language (OTSL). OTSL is designed to express table structure with a minimized vocabulary and a simple set of rules, which are both significantly reduced compared to HTML. At the same time, OTSL enables easy error detection and correction during sequence generation. We further demonstrate how the compact structure representation and minimized sequence length improves prediction accuracy and inference time in the TableFormer architecture."}, {"label": "section_header", "id": 5, "page_no": 5, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 134.765, "t": 465.872, "r": 261.801, "b": 474.679, "coord_origin": "TOPLEFT"}, "confidence": 0.9559652209281921, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 474.679, "r_x1": 149.402, "r_y1": 474.679, "r_x2": 149.402, "r_y2": 465.872, "r_x3": 134.765, "r_y3": 465.872, "coord_origin": "TOPLEFT"}, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 474.679, "r_x1": 261.801, "r_y1": 474.679, "r_x2": 261.801, "r_y2": 465.872, "r_x3": 160.859, "r_y3": 465.872, "coord_origin": "TOPLEFT"}, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.1 Language Definition"}, {"label": "text", "id": 2, "page_no": 5, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 488.998, "r": 480.589, "b": 521.706, "coord_origin": "TOPLEFT"}, "confidence": 0.9671263098716736, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 497.795, "r_x1": 480.589, "r_y1": 497.795, "r_x2": 480.589, "r_y2": 488.998, "r_x3": 134.765, "r_y3": 488.998, "coord_origin": "TOPLEFT"}, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 509.75, "r_x1": 480.587, "r_y1": 509.75, "r_x2": 480.587, "r_y2": 500.953, "r_x3": 134.765, "r_y3": 500.953, "coord_origin": "TOPLEFT"}, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 521.706, "r_x1": 154.713, "r_y1": 521.706, "r_x2": 154.713, "r_y2": 512.909, "r_x3": 134.765, "r_y3": 512.909, "coord_origin": "TOPLEFT"}, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines only 5 tokens that directly describe a tabular structure based on an atomic 2D grid."}, {"label": "text", "id": 13, "page_no": 5, "cluster": {"id": 13, "label": "text", "bbox": {"l": 149.709, "t": 525.502, "r": 409.311, "b": 534.299, "coord_origin": "TOPLEFT"}, "confidence": 0.8555866479873657, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 534.299, "r_x1": 409.311, "r_y1": 534.299, "r_x2": 409.311, "r_y2": 525.502, "r_x3": 149.709, "r_y3": 525.502, "coord_origin": "TOPLEFT"}, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The OTSL vocabulary is comprised of the following tokens:"}, {"label": "list_item", "id": 9, "page_no": 5, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 140.993, "t": 547.97, "r": 460.544, "b": 556.777, "coord_origin": "TOPLEFT"}, "confidence": 0.9184334874153137, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 556.777, "r_x1": 146.72, "r_y1": 556.777, "r_x2": 146.72, "r_y2": 547.97, "r_x3": 140.993, "r_y3": 547.97, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 556.777, "r_x1": 193.206, "r_y1": 556.777, "r_x2": 193.206, "r_y2": 547.98, "r_x3": 151.701, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.522, "r_y0": 556.777, "r_x1": 263.466, "r_y1": 556.777, "r_x2": 263.466, "r_y2": 547.98, "r_x3": 196.522, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 267.815, "r_y0": 556.777, "r_x1": 460.544, "r_y1": 556.777, "r_x2": 460.544, "r_y2": 547.98, "r_x3": 267.815, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"C\" cell a new table cell that either has or does not have cell content"}, {"label": "list_item", "id": 8, "page_no": 5, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 140.993, "t": 560.563, "r": 480.594, "b": 581.325, "coord_origin": "TOPLEFT"}, "confidence": 0.9319931268692017, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 569.37, "r_x1": 146.72, "r_y1": 569.37, "r_x2": 146.72, "r_y2": 560.563, "r_x3": 140.993, "r_y3": 560.563, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 569.37, "r_x1": 194.3, "r_y1": 569.37, "r_x2": 194.3, "r_y2": 560.573, "r_x3": 151.701, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.659, "r_y0": 569.37, "r_x1": 245.75, "r_y1": 569.37, "r_x2": 245.75, "r_y2": 560.573, "r_x3": 198.659, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "left-looking", "orig": "left-looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.263, "r_y0": 569.37, "r_x1": 264.518, "r_y1": 569.37, "r_x2": 264.518, "r_y2": 560.573, "r_x3": 250.263, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.518, "r_y0": 569.37, "r_x1": 267.285, "r_y1": 569.37, "r_x2": 267.285, "r_y2": 560.573, "r_x3": 264.518, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.638, "r_y0": 569.37, "r_x1": 480.594, "r_y1": 569.37, "r_x2": 480.594, "r_y2": 560.573, "r_x3": 271.638, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "merging with the left neighbor cell to create a", "orig": "merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 581.325, "r_x1": 171.676, "r_y1": 581.325, "r_x2": 171.676, "r_y2": 572.528, "r_x3": 151.701, "r_y3": 572.528, "coord_origin": "TOPLEFT"}, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"L\" cell left-looking cell , merging with the left neighbor cell to create a span"}, {"label": "list_item", "id": 7, "page_no": 5, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 140.993, "t": 585.112, "r": 480.588, "b": 605.874, "coord_origin": "TOPLEFT"}, "confidence": 0.9438967704772949, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 593.919, "r_x1": 146.72, "r_y1": 593.919, "r_x2": 146.72, "r_y2": 585.112, "r_x3": 140.993, "r_y3": 585.112, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 593.919, "r_x1": 194.111, "r_y1": 593.919, "r_x2": 194.111, "r_y2": 585.1220000000001, "r_x3": 151.701, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 197.748, "r_y0": 593.919, "r_x1": 259.895, "r_y1": 593.919, "r_x2": 259.895, "r_y2": 585.1220000000001, "r_x3": 197.748, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.892, "r_y0": 593.919, "r_x1": 262.659, "r_y1": 593.919, "r_x2": 262.659, "r_y2": 585.1220000000001, "r_x3": 259.892, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.295, "r_y0": 593.919, "r_x1": 480.588, "r_y1": 593.919, "r_x2": 480.588, "r_y2": 585.1220000000001, "r_x3": 266.295, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "merging with the upper neighbor cell to create a", "orig": "merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 605.874, "r_x1": 171.676, "r_y1": 605.874, "r_x2": 171.676, "r_y2": 597.077, "r_x3": 151.701, "r_y3": 597.077, "coord_origin": "TOPLEFT"}, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"U\" cell up-looking cell , merging with the upper neighbor cell to create a span"}, {"label": "list_item", "id": 10, "page_no": 5, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 140.993, "t": 609.66, "r": 454.555, "b": 618.467, "coord_origin": "TOPLEFT"}, "confidence": 0.9036387801170349, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 618.467, "r_x1": 146.72, "r_y1": 618.467, "r_x2": 146.72, "r_y2": 609.66, "r_x3": 140.993, "r_y3": 609.66, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 618.467, "r_x1": 193.483, "r_y1": 618.467, "r_x2": 193.483, "r_y2": 609.67, "r_x3": 151.701, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.799, "r_y0": 618.467, "r_x1": 236.12, "r_y1": 618.467, "r_x2": 236.12, "r_y2": 609.67, "r_x3": 196.799, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.125, "r_y0": 618.467, "r_x1": 238.892, "r_y1": 618.467, "r_x2": 238.892, "r_y2": 609.67, "r_x3": 236.125, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.209, "r_y0": 618.467, "r_x1": 454.555, "r_y1": 618.467, "r_x2": 454.555, "r_y2": 609.67, "r_x3": 242.209, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "to merge with both left and upper neighbor cells", "orig": "to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"X\" cell cross cell , to merge with both left and upper neighbor cells"}, {"label": "list_item", "id": 12, "page_no": 5, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 140.993, "t": 622.254, "r": 328.617, "b": 631.061, "coord_origin": "TOPLEFT"}, "confidence": 0.8636871576309204, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 631.061, "r_x1": 146.72, "r_y1": 631.061, "r_x2": 146.72, "r_y2": 622.254, "r_x3": 140.993, "r_y3": 622.254, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 631.061, "r_x1": 181.994, "r_y1": 631.061, "r_x2": 181.994, "r_y2": 622.264, "r_x3": 151.701, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.317, "r_y0": 631.061, "r_x1": 221.462, "r_y1": 631.061, "r_x2": 221.462, "r_y2": 622.264, "r_x3": 185.317, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.461, "r_y0": 631.061, "r_x1": 224.228, "r_y1": 631.061, "r_x2": 224.228, "r_y2": 622.264, "r_x3": 221.461, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.545, "r_y0": 631.061, "r_x1": 328.617, "r_y1": 631.061, "r_x2": 328.617, "r_y2": 622.264, "r_x3": 227.545, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "switch to the next row.", "orig": "switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"NL\" new-line , switch to the next row."}, {"label": "text", "id": 6, "page_no": 5, "cluster": {"id": 6, "label": "text", "bbox": {"l": 134.765, "t": 644.1030000000001, "r": 480.593, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9443338513374329, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 652.9, "r_x1": 480.593, "r_y1": 652.9, "r_x2": 480.593, "r_y2": 644.1030000000001, "r_x3": 149.709, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 228.223, "r_y1": 664.855, "r_x2": 228.223, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless conversion to HTML."}], "body": [{"label": "text", "id": 3, "page_no": 5, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.595, "b": 139.68600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9633480906486511, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.595, "r_y1": 127.731, "r_x2": 480.595, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 364.625, "r_y1": 139.68600000000004, "r_x2": 364.625, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these complex syntax rules, simply to deliver valid output."}, {"label": "text", "id": 1, "page_no": 5, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 143.48299999999995, "r": 480.596, "b": 295.742, "coord_origin": "TOPLEFT"}, "confidence": 0.9856827855110168, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 152.27999999999997, "r_x1": 480.59, "r_y1": 152.27999999999997, "r_x2": 480.59, "r_y2": 143.48299999999995, "r_x3": 149.709, "r_y3": 143.48299999999995, "coord_origin": "TOPLEFT"}, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 164.235, "r_x1": 480.594, "r_y1": 164.235, "r_x2": 480.594, "r_y2": 155.438, "r_x3": 134.765, "r_y3": 155.438, "coord_origin": "TOPLEFT"}, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 176.19000000000005, "r_x1": 480.587, "r_y1": 176.19000000000005, "r_x2": 480.587, "r_y2": 167.39300000000003, "r_x3": 134.765, "r_y3": 167.39300000000003, "coord_origin": "TOPLEFT"}, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 188.14499999999998, "r_x1": 480.595, "r_y1": 188.14499999999998, "r_x2": 480.595, "r_y2": 179.34799999999996, "r_x3": 134.765, "r_y3": 179.34799999999996, "coord_origin": "TOPLEFT"}, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 200.10000000000002, "r_x1": 314.278, "r_y1": 200.10000000000002, "r_x2": 314.278, "r_y2": 191.303, "r_x3": 134.765, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.056, "r_y0": 200.10000000000002, "r_x1": 374.087, "r_y1": 200.10000000000002, "r_x2": 374.087, "r_y2": 191.303, "r_x3": 318.056, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.809, "r_y0": 200.10000000000002, "r_x1": 480.586, "r_y1": 200.10000000000002, "r_x2": 480.586, "r_y2": 191.303, "r_x3": 378.809, "r_y3": 191.303, "coord_origin": "TOPLEFT"}, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 212.05600000000004, "r_x1": 480.588, "r_y1": 212.05600000000004, "r_x2": 480.588, "r_y2": 203.25900000000001, "r_x3": 134.765, "r_y3": 203.25900000000001, "coord_origin": "TOPLEFT"}, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 224.01099999999997, "r_x1": 480.596, "r_y1": 224.01099999999997, "r_x2": 480.596, "r_y2": 215.21400000000006, "r_x3": 134.765, "r_y3": 215.21400000000006, "coord_origin": "TOPLEFT"}, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 235.966, "r_x1": 480.595, "r_y1": 235.966, "r_x2": 480.595, "r_y2": 227.16899999999998, "r_x3": 134.765, "r_y3": 227.16899999999998, "coord_origin": "TOPLEFT"}, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 247.92100000000005, "r_x1": 480.588, "r_y1": 247.92100000000005, "r_x2": 480.588, "r_y2": 239.12400000000002, "r_x3": 134.765, "r_y3": 239.12400000000002, "coord_origin": "TOPLEFT"}, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 259.876, "r_x1": 480.593, "r_y1": 259.876, "r_x2": 480.593, "r_y2": 251.07899999999995, "r_x3": 134.765, "r_y3": 251.07899999999995, "coord_origin": "TOPLEFT"}, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 271.831, "r_x1": 480.595, "r_y1": 271.831, "r_x2": 480.595, "r_y2": 263.034, "r_x3": 134.765, "r_y3": 263.034, "coord_origin": "TOPLEFT"}, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 283.787, "r_x1": 480.59, "r_y1": 283.787, "r_x2": 480.59, "r_y2": 274.99, "r_x3": 134.765, "r_y3": 274.99, "coord_origin": "TOPLEFT"}, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.742, "r_x1": 223.573, "r_y1": 295.742, "r_x2": 223.573, "r_y2": 286.945, "r_x3": 134.765, "r_y3": 286.945, "coord_origin": "TOPLEFT"}, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In practice, we observe two major issues with prediction quality when training Im2Seq models on HTML table structure generation from images. On the one hand, we find that on large tables, the visual attention of the model often starts to drift and is not accurately moving forward cell by cell anymore. This manifests itself in either in an increasing location drift for proposed table-cells in later rows on the same column or even complete loss of vertical alignment, as illustrated in Figure 5. Addressing this with post-processing is partially possible, but clearly undesired. On the other hand, we find many instances of predictions with structural inconsistencies or plain invalid HTML output, as shown in Figure 6, which are nearly impossible to properly correct. Both problems seriously impact the TSR model performance, since they reflect not only in the task of pure structure recognition but also in the equally crucial recognition or matching of table cell content."}, {"label": "section_header", "id": 4, "page_no": 5, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 134.765, "t": 320.631, "r": 372.508, "b": 331.199, "coord_origin": "TOPLEFT"}, "confidence": 0.957028865814209, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.199, "r_x1": 141.489, "r_y1": 331.199, "r_x2": 141.489, "r_y2": 320.631, "r_x3": 134.765, "r_y3": 320.631, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 331.199, "r_x1": 372.508, "r_y1": 331.199, "r_x2": 372.508, "r_y2": 320.631, "r_x3": 154.938, "r_y3": 320.631, "coord_origin": "TOPLEFT"}, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4 Optimised Table Structure Language"}, {"label": "text", "id": 0, "page_no": 5, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 349.117, "r": 480.595, "b": 441.6, "coord_origin": "TOPLEFT"}, "confidence": 0.9879323840141296, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 357.914, "r_x1": 480.591, "r_y1": 357.914, "r_x2": 480.591, "r_y2": 349.117, "r_x3": 134.765, "r_y3": 349.117, "coord_origin": "TOPLEFT"}, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 369.869, "r_x1": 480.589, "r_y1": 369.869, "r_x2": 480.589, "r_y2": 361.072, "r_x3": 134.765, "r_y3": 361.072, "coord_origin": "TOPLEFT"}, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 381.825, "r_x1": 480.587, "r_y1": 381.825, "r_x2": 480.587, "r_y2": 373.028, "r_x3": 134.765, "r_y3": 373.028, "coord_origin": "TOPLEFT"}, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 393.78, "r_x1": 146.993, "r_y1": 393.78, "r_x2": 146.993, "r_y2": 384.983, "r_x3": 134.765, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "set", "orig": "set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.088, "r_y0": 393.78, "r_x1": 159.112, "r_y1": 393.78, "r_x2": 159.112, "r_y2": 384.983, "r_x3": 151.088, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.196, "r_y0": 393.78, "r_x1": 186.519, "r_y1": 393.78, "r_x2": 186.519, "r_y2": 384.983, "r_x3": 163.196, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "rules,", "orig": "rules,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.613, "r_y0": 393.78, "r_x1": 480.589, "r_y1": 393.78, "r_x2": 480.589, "r_y2": 384.983, "r_x3": 190.613, "r_y3": 384.983, "coord_origin": "TOPLEFT"}, "text": "which are both significantly reduced compared to HTML. At the", "orig": "which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 405.735, "r_x1": 480.59, "r_y1": 405.735, "r_x2": 480.59, "r_y2": 396.938, "r_x3": 134.765, "r_y3": 396.938, "coord_origin": "TOPLEFT"}, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 417.69, "r_x1": 480.595, "r_y1": 417.69, "r_x2": 480.595, "r_y2": 408.893, "r_x3": 134.765, "r_y3": 408.893, "coord_origin": "TOPLEFT"}, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 429.645, "r_x1": 480.589, "r_y1": 429.645, "r_x2": 480.589, "r_y2": 420.848, "r_x3": 134.765, "r_y3": 420.848, "coord_origin": "TOPLEFT"}, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 441.6, "r_x1": 276.673, "r_y1": 441.6, "r_x2": 276.673, "r_y2": 432.803, "r_x3": 134.765, "r_y3": 432.803, "coord_origin": "TOPLEFT"}, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before, we propose here our Optimised Table Structure Language (OTSL). OTSL is designed to express table structure with a minimized vocabulary and a simple set of rules, which are both significantly reduced compared to HTML. At the same time, OTSL enables easy error detection and correction during sequence generation. We further demonstrate how the compact structure representation and minimized sequence length improves prediction accuracy and inference time in the TableFormer architecture."}, {"label": "section_header", "id": 5, "page_no": 5, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 134.765, "t": 465.872, "r": 261.801, "b": 474.679, "coord_origin": "TOPLEFT"}, "confidence": 0.9559652209281921, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 474.679, "r_x1": 149.402, "r_y1": 474.679, "r_x2": 149.402, "r_y2": 465.872, "r_x3": 134.765, "r_y3": 465.872, "coord_origin": "TOPLEFT"}, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 474.679, "r_x1": 261.801, "r_y1": 474.679, "r_x2": 261.801, "r_y2": 465.872, "r_x3": 160.859, "r_y3": 465.872, "coord_origin": "TOPLEFT"}, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.1 Language Definition"}, {"label": "text", "id": 2, "page_no": 5, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 488.998, "r": 480.589, "b": 521.706, "coord_origin": "TOPLEFT"}, "confidence": 0.9671263098716736, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 497.795, "r_x1": 480.589, "r_y1": 497.795, "r_x2": 480.589, "r_y2": 488.998, "r_x3": 134.765, "r_y3": 488.998, "coord_origin": "TOPLEFT"}, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 509.75, "r_x1": 480.587, "r_y1": 509.75, "r_x2": 480.587, "r_y2": 500.953, "r_x3": 134.765, "r_y3": 500.953, "coord_origin": "TOPLEFT"}, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 521.706, "r_x1": 154.713, "r_y1": 521.706, "r_x2": 154.713, "r_y2": 512.909, "r_x3": 134.765, "r_y3": 512.909, "coord_origin": "TOPLEFT"}, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines only 5 tokens that directly describe a tabular structure based on an atomic 2D grid."}, {"label": "text", "id": 13, "page_no": 5, "cluster": {"id": 13, "label": "text", "bbox": {"l": 149.709, "t": 525.502, "r": 409.311, "b": 534.299, "coord_origin": "TOPLEFT"}, "confidence": 0.8555866479873657, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 534.299, "r_x1": 409.311, "r_y1": 534.299, "r_x2": 409.311, "r_y2": 525.502, "r_x3": 149.709, "r_y3": 525.502, "coord_origin": "TOPLEFT"}, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The OTSL vocabulary is comprised of the following tokens:"}, {"label": "list_item", "id": 9, "page_no": 5, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 140.993, "t": 547.97, "r": 460.544, "b": 556.777, "coord_origin": "TOPLEFT"}, "confidence": 0.9184334874153137, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 556.777, "r_x1": 146.72, "r_y1": 556.777, "r_x2": 146.72, "r_y2": 547.97, "r_x3": 140.993, "r_y3": 547.97, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 556.777, "r_x1": 193.206, "r_y1": 556.777, "r_x2": 193.206, "r_y2": 547.98, "r_x3": 151.701, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.522, "r_y0": 556.777, "r_x1": 263.466, "r_y1": 556.777, "r_x2": 263.466, "r_y2": 547.98, "r_x3": 196.522, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 267.815, "r_y0": 556.777, "r_x1": 460.544, "r_y1": 556.777, "r_x2": 460.544, "r_y2": 547.98, "r_x3": 267.815, "r_y3": 547.98, "coord_origin": "TOPLEFT"}, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"C\" cell a new table cell that either has or does not have cell content"}, {"label": "list_item", "id": 8, "page_no": 5, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 140.993, "t": 560.563, "r": 480.594, "b": 581.325, "coord_origin": "TOPLEFT"}, "confidence": 0.9319931268692017, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 569.37, "r_x1": 146.72, "r_y1": 569.37, "r_x2": 146.72, "r_y2": 560.563, "r_x3": 140.993, "r_y3": 560.563, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 569.37, "r_x1": 194.3, "r_y1": 569.37, "r_x2": 194.3, "r_y2": 560.573, "r_x3": 151.701, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.659, "r_y0": 569.37, "r_x1": 245.75, "r_y1": 569.37, "r_x2": 245.75, "r_y2": 560.573, "r_x3": 198.659, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "left-looking", "orig": "left-looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.263, "r_y0": 569.37, "r_x1": 264.518, "r_y1": 569.37, "r_x2": 264.518, "r_y2": 560.573, "r_x3": 250.263, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.518, "r_y0": 569.37, "r_x1": 267.285, "r_y1": 569.37, "r_x2": 267.285, "r_y2": 560.573, "r_x3": 264.518, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.638, "r_y0": 569.37, "r_x1": 480.594, "r_y1": 569.37, "r_x2": 480.594, "r_y2": 560.573, "r_x3": 271.638, "r_y3": 560.573, "coord_origin": "TOPLEFT"}, "text": "merging with the left neighbor cell to create a", "orig": "merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 581.325, "r_x1": 171.676, "r_y1": 581.325, "r_x2": 171.676, "r_y2": 572.528, "r_x3": 151.701, "r_y3": 572.528, "coord_origin": "TOPLEFT"}, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"L\" cell left-looking cell , merging with the left neighbor cell to create a span"}, {"label": "list_item", "id": 7, "page_no": 5, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 140.993, "t": 585.112, "r": 480.588, "b": 605.874, "coord_origin": "TOPLEFT"}, "confidence": 0.9438967704772949, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 593.919, "r_x1": 146.72, "r_y1": 593.919, "r_x2": 146.72, "r_y2": 585.112, "r_x3": 140.993, "r_y3": 585.112, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 593.919, "r_x1": 194.111, "r_y1": 593.919, "r_x2": 194.111, "r_y2": 585.1220000000001, "r_x3": 151.701, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 197.748, "r_y0": 593.919, "r_x1": 259.895, "r_y1": 593.919, "r_x2": 259.895, "r_y2": 585.1220000000001, "r_x3": 197.748, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.892, "r_y0": 593.919, "r_x1": 262.659, "r_y1": 593.919, "r_x2": 262.659, "r_y2": 585.1220000000001, "r_x3": 259.892, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.295, "r_y0": 593.919, "r_x1": 480.588, "r_y1": 593.919, "r_x2": 480.588, "r_y2": 585.1220000000001, "r_x3": 266.295, "r_y3": 585.1220000000001, "coord_origin": "TOPLEFT"}, "text": "merging with the upper neighbor cell to create a", "orig": "merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 605.874, "r_x1": 171.676, "r_y1": 605.874, "r_x2": 171.676, "r_y2": 597.077, "r_x3": 151.701, "r_y3": 597.077, "coord_origin": "TOPLEFT"}, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"U\" cell up-looking cell , merging with the upper neighbor cell to create a span"}, {"label": "list_item", "id": 10, "page_no": 5, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 140.993, "t": 609.66, "r": 454.555, "b": 618.467, "coord_origin": "TOPLEFT"}, "confidence": 0.9036387801170349, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 618.467, "r_x1": 146.72, "r_y1": 618.467, "r_x2": 146.72, "r_y2": 609.66, "r_x3": 140.993, "r_y3": 609.66, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 618.467, "r_x1": 193.483, "r_y1": 618.467, "r_x2": 193.483, "r_y2": 609.67, "r_x3": 151.701, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.799, "r_y0": 618.467, "r_x1": 236.12, "r_y1": 618.467, "r_x2": 236.12, "r_y2": 609.67, "r_x3": 196.799, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.125, "r_y0": 618.467, "r_x1": 238.892, "r_y1": 618.467, "r_x2": 238.892, "r_y2": 609.67, "r_x3": 236.125, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.209, "r_y0": 618.467, "r_x1": 454.555, "r_y1": 618.467, "r_x2": 454.555, "r_y2": 609.67, "r_x3": 242.209, "r_y3": 609.67, "coord_origin": "TOPLEFT"}, "text": "to merge with both left and upper neighbor cells", "orig": "to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"X\" cell cross cell , to merge with both left and upper neighbor cells"}, {"label": "list_item", "id": 12, "page_no": 5, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 140.993, "t": 622.254, "r": 328.617, "b": 631.061, "coord_origin": "TOPLEFT"}, "confidence": 0.8636871576309204, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.993, "r_y0": 631.061, "r_x1": 146.72, "r_y1": 631.061, "r_x2": 146.72, "r_y2": 622.254, "r_x3": 140.993, "r_y3": 622.254, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 631.061, "r_x1": 181.994, "r_y1": 631.061, "r_x2": 181.994, "r_y2": 622.264, "r_x3": 151.701, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.317, "r_y0": 631.061, "r_x1": 221.462, "r_y1": 631.061, "r_x2": 221.462, "r_y2": 622.264, "r_x3": 185.317, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.461, "r_y0": 631.061, "r_x1": 224.228, "r_y1": 631.061, "r_x2": 224.228, "r_y2": 622.264, "r_x3": 221.461, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.545, "r_y0": 631.061, "r_x1": 328.617, "r_y1": 631.061, "r_x2": 328.617, "r_y2": 622.264, "r_x3": 227.545, "r_y3": 622.264, "coord_origin": "TOPLEFT"}, "text": "switch to the next row.", "orig": "switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "-\"NL\" new-line , switch to the next row."}, {"label": "text", "id": 6, "page_no": 5, "cluster": {"id": 6, "label": "text", "bbox": {"l": 134.765, "t": 644.1030000000001, "r": 480.593, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9443338513374329, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 652.9, "r_x1": 480.593, "r_y1": 652.9, "r_x2": 480.593, "r_y2": 644.1030000000001, "r_x3": 149.709, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 228.223, "r_y1": 664.855, "r_x2": 228.223, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless conversion to HTML."}], "headers": [{"label": "page_header", "id": 14, "page_no": 5, "cluster": {"id": 14, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8378868699073792, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6"}, {"label": "page_header", "id": 11, "page_no": 5, "cluster": {"id": 11, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8919177651405334, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}]}}, {"page_no": 6, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 133.72500000000002, "r_x1": 162.644, "r_y1": 133.72500000000002, "r_x2": 162.644, "r_y2": 125.79899999999998, "r_x3": 134.765, "r_y3": 125.79899999999998, "coord_origin": "TOPLEFT"}, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.276, "r_y0": 134.87300000000005, "r_x1": 480.587, "r_y1": 134.87300000000005, "r_x2": 480.587, "r_y2": 123.58399999999995, "r_x3": 166.276, "r_y3": 123.58399999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 145.832, "r_x1": 171.412, "r_y1": 145.832, "r_x2": 171.412, "r_y2": 134.543, "r_x3": 134.765, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "sentation", "orig": "sentation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.546, "r_y0": 145.832, "r_x1": 182.968, "r_y1": 145.832, "r_x2": 182.968, "r_y2": 134.543, "r_x3": 175.546, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.093, "r_y0": 145.832, "r_x1": 207.058, "r_y1": 145.832, "r_x2": 207.058, "r_y2": 134.543, "r_x3": 187.093, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.192, "r_y0": 145.832, "r_x1": 250.188, "r_y1": 145.832, "r_x2": 250.188, "r_y2": 134.543, "r_x3": 211.192, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "structure;", "orig": "structure;", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.312, "r_y0": 145.832, "r_x1": 480.587, "r_y1": 145.832, "r_x2": 480.587, "r_y2": 134.543, "r_x3": 254.312, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "C - mapping structure on a grid; D - OTSL structure", "orig": "C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 156.79100000000005, "r_x1": 306.116, "r_y1": 156.79100000000005, "r_x2": 306.116, "r_y2": 145.50199999999995, "r_x3": 134.765, "r_y3": 145.50199999999995, "coord_origin": "TOPLEFT"}, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.493, "r_y0": 177.88099999999997, "r_x1": 428.861, "r_y1": 177.22199999999998, "r_x2": 428.861, "r_y2": 168.05399999999997, "r_x3": 374.493, "r_y3": 168.71299999999997, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.769, "r_y0": 202.21299999999997, "r_x1": 448.17, "r_y1": 201.78200000000004, "r_x2": 448.17, "r_y2": 192.61400000000003, "r_x3": 373.769, "r_y3": 193.04499999999996, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.687, "r_y0": 214.42499999999995, "r_x1": 448.085, "r_y1": 214.11800000000005, "r_x2": 448.085, "r_y2": 204.95000000000005, "r_x3": 386.687, "r_y3": 205.25699999999995, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.657, "r_y0": 190.01999999999998, "r_x1": 448.147, "r_y1": 189.48800000000006, "r_x2": 448.147, "r_y2": 180.32000000000005, "r_x3": 398.657, "r_y3": 180.85199999999998, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.506, "r_y0": 226.32600000000002, "r_x1": 448.302, "r_y1": 226.52099999999996, "r_x2": 448.302, "r_y2": 217.35299999999995, "r_x3": 386.506, "r_y3": 217.15800000000002, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.16, "r_y0": 176.97699999999998, "r_x1": 447.863, "r_y1": 176.97699999999998, "r_x2": 447.863, "r_y2": 167.80899999999997, "r_x3": 435.16, "r_y3": 167.80899999999997, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.15, "r_y0": 214.52200000000005, "r_x1": 381.325, "r_y1": 214.52200000000005, "r_x2": 381.325, "r_y2": 205.35400000000004, "r_x3": 374.15, "r_y3": 205.35400000000004, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.042, "r_y0": 226.43399999999997, "r_x1": 381.217, "r_y1": 226.43399999999997, "r_x2": 381.217, "r_y2": 217.26599999999996, "r_x3": 374.042, "r_y3": 217.26599999999996, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.344, "r_y0": 190.22199999999998, "r_x1": 393.765, "r_y1": 190.07299999999998, "r_x2": 393.765, "r_y2": 180.90499999999997, "r_x3": 374.344, "r_y3": 181.05399999999997, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.259, "r_y0": 253.79600000000005, "r_x1": 301.055, "r_y1": 253.78099999999995, "r_x2": 301.055, "r_y2": 244.61300000000006, "r_x3": 282.259, "r_y3": 244.62800000000004, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.11, "r_y0": 266.13800000000003, "r_x1": 325.59, "r_y1": 265.58900000000006, "r_x2": 325.59, "r_y2": 256.42100000000005, "r_x3": 282.11, "r_y3": 256.96900000000005, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.408, "r_y0": 278.41999999999996, "r_x1": 325.478, "r_y1": 278.14200000000005, "r_x2": 325.478, "r_y2": 268.97400000000005, "r_x3": 282.408, "r_y3": 269.25199999999995, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 307.466, "r_y0": 253.861, "r_x1": 312.992, "r_y1": 253.861, "r_x2": 312.992, "r_y2": 244.69299999999998, "r_x3": 307.466, "r_y3": 244.69299999999998, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.769, "r_y0": 253.72799999999995, "r_x1": 324.294, "r_y1": 253.72799999999995, "r_x2": 324.294, "r_y2": 244.55999999999995, "r_x3": 318.769, "r_y3": 244.55999999999995, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.939, "r_y0": 278.03499999999997, "r_x1": 214.734, "r_y1": 278.02, "r_x2": 214.734, "r_y2": 268.852, "r_x3": 195.939, "r_y3": 268.86699999999996, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.146, "r_y0": 278.1, "r_x1": 226.671, "r_y1": 278.1, "r_x2": 226.671, "r_y2": 268.932, "r_x3": 221.146, "r_y3": 268.932, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.449, "r_y0": 277.967, "r_x1": 237.974, "r_y1": 277.967, "r_x2": 237.974, "r_y2": 268.799, "r_x3": 232.449, "r_y3": 268.799, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.217, "r_y0": 253.827, "r_x1": 203.392, "r_y1": 253.827, "r_x2": 203.392, "r_y2": 244.659, "r_x3": 196.217, "r_y3": 244.659, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.321, "r_y0": 253.385, "r_x1": 257.497, "r_y1": 253.385, "r_x2": 257.497, "r_y2": 244.21699999999998, "r_x3": 250.321, "r_y3": 244.21699999999998, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.172, "r_y0": 265.727, "r_x1": 257.348, "r_y1": 265.727, "r_x2": 257.348, "r_y2": 256.55899999999997, "r_x3": 250.172, "r_y3": 256.55899999999997, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.47, "r_y0": 278.01, "r_x1": 257.646, "r_y1": 278.01, "r_x2": 257.646, "r_y2": 268.842, "r_x3": 250.47, "r_y3": 268.842, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 249.18600000000004, "r_x1": 391.495, "r_y1": 249.18600000000004, "r_x2": 391.495, "r_y2": 243.07399999999996, "r_x3": 334.511, "r_y3": 243.07399999999996, "coord_origin": "TOPLEFT"}, "text": "1 - simple cells: \"C\"", "orig": "1 - simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 259.124, "r_x1": 421.986, "r_y1": 259.124, "r_x2": 421.986, "r_y2": 253.01199999999994, "r_x3": 334.511, "r_y3": 253.01199999999994, "coord_origin": "TOPLEFT"}, "text": "2 - horizontal merges: \"C\", \"L\"", "orig": "2 - horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 269.062, "r_x1": 415.344, "r_y1": 269.062, "r_x2": 415.344, "r_y2": 262.95000000000005, "r_x3": 334.511, "r_y3": 262.95000000000005, "coord_origin": "TOPLEFT"}, "text": "3 - vertical merges: \"C\", \"U\"", "orig": "3 - vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 279.0, "r_x1": 426.599, "r_y1": 279.0, "r_x2": 426.599, "r_y2": 272.88800000000003, "r_x3": 334.511, "r_y3": 272.88800000000003, "coord_origin": "TOPLEFT"}, "text": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.672, "r_y0": 250.23400000000004, "r_x1": 189.355, "r_y1": 250.23400000000004, "r_x2": 189.355, "r_y2": 244.12199999999996, "r_x3": 185.672, "r_y3": 244.12199999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.968, "r_y0": 274.539, "r_x1": 189.651, "r_y1": 274.539, "r_x2": 189.651, "r_y2": 268.427, "r_x3": 185.968, "r_y3": 268.427, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.342, "r_y0": 249.817, "r_x1": 243.025, "r_y1": 249.817, "r_x2": 243.025, "r_y2": 243.70500000000004, "r_x3": 239.342, "r_y3": 243.70500000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.329, "r_y0": 249.68499999999995, "r_x1": 275.012, "r_y1": 249.68499999999995, "r_x2": 275.012, "r_y2": 243.57299999999998, "r_x3": 271.329, "r_y3": 243.57299999999998, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.816, "r_y0": 172.707, "r_x1": 233.5, "r_y1": 172.707, "r_x2": 233.5, "r_y2": 166.59400000000005, "r_x3": 229.816, "r_y3": 166.59400000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.244, "r_y0": 196.15300000000002, "r_x1": 260.928, "r_y1": 196.15300000000002, "r_x2": 260.928, "r_y2": 190.03999999999996, "r_x3": 257.244, "r_y3": 190.03999999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.875, "r_y0": 184.168, "r_x1": 190.559, "r_y1": 184.168, "r_x2": 190.559, "r_y2": 178.05600000000004, "r_x3": 186.875, "r_y3": 178.05600000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.487, "r_y0": 175.207, "r_x1": 200.171, "r_y1": 175.207, "r_x2": 200.171, "r_y2": 169.09500000000003, "r_x3": 196.487, "r_y3": 169.09500000000003, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 175.62199999999996, "r_x1": 175.727, "r_y1": 175.62199999999996, "r_x2": 175.727, "r_y2": 167.98199999999997, "r_x3": 169.747, "r_y3": 167.98199999999997, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 214.57799999999997, "r_x1": 175.727, "r_y1": 214.57799999999997, "r_x2": 175.727, "r_y2": 206.938, "r_x3": 169.747, "r_y3": 206.938, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.294, "r_y0": 176.019, "r_x1": 280.273, "r_y1": 176.019, "r_x2": 280.273, "r_y2": 168.37900000000002, "r_x3": 274.294, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.562, "r_y0": 176.019, "r_x1": 365.541, "r_y1": 176.019, "r_x2": 365.541, "r_y2": 168.37900000000002, "r_x3": 359.562, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 250.95100000000002, "r_x1": 175.271, "r_y1": 250.95100000000002, "r_x2": 175.271, "r_y2": 243.31100000000004, "r_x3": 169.747, "r_y3": 243.31100000000004, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 314.103, "r_x1": 149.402, "r_y1": 314.103, "r_x2": 149.402, "r_y2": 305.296, "r_x3": 134.765, "r_y3": 305.296, "coord_origin": "TOPLEFT"}, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 314.103, "r_x1": 246.652, "r_y1": 314.103, "r_x2": 246.652, "r_y2": 305.296, "r_x3": 160.859, "r_y3": 305.296, "coord_origin": "TOPLEFT"}, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 334.045, "r_x1": 363.796, "r_y1": 334.045, "r_x2": 363.796, "r_y2": 325.248, "r_x3": 134.765, "r_y3": 325.248, "coord_origin": "TOPLEFT"}, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 355.978, "r_x1": 146.72, "r_y1": 355.978, "r_x2": 146.72, "r_y2": 347.181, "r_x3": 138.973, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 355.978, "r_x1": 257.379, "r_y1": 355.978, "r_x2": 257.379, "r_y2": 347.171, "r_x3": 151.701, "r_y3": 347.171, "coord_origin": "TOPLEFT"}, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.383, "r_y0": 355.978, "r_x1": 260.15, "r_y1": 355.978, "r_x2": 260.15, "r_y2": 347.181, "r_x3": 257.383, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.184, "r_y0": 355.978, "r_x1": 480.589, "r_y1": 355.978, "r_x2": 480.589, "r_y2": 347.181, "r_x3": 264.184, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": "The left neighbour of an \"L\" cell must be either", "orig": "The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 367.934, "r_x1": 283.594, "r_y1": 367.934, "r_x2": 283.594, "r_y2": 359.137, "r_x3": 151.701, "r_y3": 359.137, "coord_origin": "TOPLEFT"}, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 379.892, "r_x1": 146.72, "r_y1": 379.892, "r_x2": 146.72, "r_y2": 371.095, "r_x3": 138.973, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 379.892, "r_x1": 252.112, "r_y1": 379.892, "r_x2": 252.112, "r_y2": 371.085, "r_x3": 151.701, "r_y3": 371.085, "coord_origin": "TOPLEFT"}, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.112, "r_y0": 379.892, "r_x1": 254.879, "r_y1": 379.892, "r_x2": 254.879, "r_y2": 371.095, "r_x3": 252.112, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.764, "r_y0": 379.892, "r_x1": 480.592, "r_y1": 379.892, "r_x2": 480.592, "r_y2": 371.095, "r_x3": 258.764, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": "The upper neighbour of a \"U\" cell must be either", "orig": "The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 391.847, "r_x1": 284.839, "r_y1": 391.847, "r_x2": 284.839, "r_y2": 383.05, "r_x3": 151.701, "r_y3": 383.05, "coord_origin": "TOPLEFT"}, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 403.805, "r_x1": 146.72, "r_y1": 403.805, "r_x2": 146.72, "r_y2": 395.008, "r_x3": 138.973, "r_y3": 395.008, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 403.805, "r_x1": 223.304, "r_y1": 403.805, "r_x2": 223.304, "r_y2": 394.998, "r_x3": 151.701, "r_y3": 394.998, "coord_origin": "TOPLEFT"}, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 223.307, "r_y0": 403.805, "r_x1": 226.074, "r_y1": 403.805, "r_x2": 226.074, "r_y2": 395.008, "r_x3": 223.307, "r_y3": 395.008, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 415.764, "r_x1": 480.592, "r_y1": 415.764, "r_x2": 480.592, "r_y2": 406.967, "r_x3": 151.701, "r_y3": 406.967, "coord_origin": "TOPLEFT"}, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 427.719, "r_x1": 480.592, "r_y1": 427.719, "r_x2": 480.592, "r_y2": 418.922, "r_x3": 151.701, "r_y3": 418.922, "coord_origin": "TOPLEFT"}, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 439.674, "r_x1": 214.397, "r_y1": 439.674, "r_x2": 214.397, "r_y2": 430.877, "r_x3": 151.701, "r_y3": 430.877, "coord_origin": "TOPLEFT"}, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 451.633, "r_x1": 146.72, "r_y1": 451.633, "r_x2": 146.72, "r_y2": 442.836, "r_x3": 138.973, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 451.633, "r_x1": 221.323, "r_y1": 451.633, "r_x2": 221.323, "r_y2": 442.826, "r_x3": 151.701, "r_y3": 442.826, "coord_origin": "TOPLEFT"}, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.327, "r_y0": 451.633, "r_x1": 224.094, "r_y1": 451.633, "r_x2": 224.094, "r_y2": 442.836, "r_x3": 221.327, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.411, "r_y0": 451.633, "r_x1": 474.59, "r_y1": 451.633, "r_x2": 474.59, "r_y2": 442.836, "r_x3": 227.411, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": "Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": "Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 463.591, "r_x1": 146.72, "r_y1": 463.591, "r_x2": 146.72, "r_y2": 454.794, "r_x3": 138.973, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 463.591, "r_x1": 240.72, "r_y1": 463.591, "r_x2": 240.72, "r_y2": 454.784, "r_x3": 151.701, "r_y3": 454.784, "coord_origin": "TOPLEFT"}, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.716, "r_y0": 463.591, "r_x1": 243.483, "r_y1": 463.591, "r_x2": 243.483, "r_y2": 454.794, "r_x3": 240.716, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.458, "r_y0": 463.591, "r_x1": 480.588, "r_y1": 463.591, "r_x2": 480.588, "r_y2": 454.794, "r_x3": 247.458, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": "Only \"U\" cells and \"C\" cells are allowed in the first", "orig": "Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 475.546, "r_x1": 186.007, "r_y1": 475.546, "r_x2": 186.007, "r_y2": 466.749, "r_x3": 151.701, "r_y3": 466.749, "coord_origin": "TOPLEFT"}, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 487.504, "r_x1": 146.72, "r_y1": 487.504, "r_x2": 146.72, "r_y2": 478.707, "r_x3": 138.973, "r_y3": 478.707, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 487.504, "r_x1": 235.158, "r_y1": 487.504, "r_x2": 235.158, "r_y2": 478.697, "r_x3": 151.701, "r_y3": 478.697, "coord_origin": "TOPLEFT"}, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.157, "r_y0": 487.504, "r_x1": 480.595, "r_y1": 487.504, "r_x2": 480.595, "r_y2": 478.707, "r_x3": 235.157, "r_y3": 478.707, "coord_origin": "TOPLEFT"}, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 499.46, "r_x1": 448.042, "r_y1": 499.46, "r_x2": 448.042, "r_y2": 490.663, "r_x3": 151.701, "r_y3": 490.663, "coord_origin": "TOPLEFT"}, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 521.39, "r_x1": 480.596, "r_y1": 521.39, "r_x2": 480.596, "r_y2": 512.5930000000001, "r_x3": 149.709, "r_y3": 512.5930000000001, "coord_origin": "TOPLEFT"}, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.345, "r_x1": 480.591, "r_y1": 533.345, "r_x2": 480.591, "r_y2": 524.548, "r_x3": 134.765, "r_y3": 524.548, "coord_origin": "TOPLEFT"}, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.3, "r_x1": 480.595, "r_y1": 545.3, "r_x2": 480.595, "r_y2": 536.5029999999999, "r_x3": 134.765, "r_y3": 536.5029999999999, "coord_origin": "TOPLEFT"}, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.256, "r_x1": 480.589, "r_y1": 557.256, "r_x2": 480.589, "r_y2": 548.4590000000001, "r_x3": 134.765, "r_y3": 548.4590000000001, "coord_origin": "TOPLEFT"}, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.211, "r_x1": 480.594, "r_y1": 569.211, "r_x2": 480.594, "r_y2": 560.414, "r_x3": 134.765, "r_y3": 560.414, "coord_origin": "TOPLEFT"}, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.1659999999999, "r_x1": 480.587, "r_y1": 581.1659999999999, "r_x2": 480.587, "r_y2": 572.369, "r_x3": 134.765, "r_y3": 572.369, "coord_origin": "TOPLEFT"}, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.121, "r_x1": 480.592, "r_y1": 593.121, "r_x2": 480.592, "r_y2": 584.3240000000001, "r_x3": 134.765, "r_y3": 584.3240000000001, "coord_origin": "TOPLEFT"}, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.076, "r_x1": 480.592, "r_y1": 605.076, "r_x2": 480.592, "r_y2": 596.279, "r_x3": 134.765, "r_y3": 596.279, "coord_origin": "TOPLEFT"}, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.032, "r_x1": 480.594, "r_y1": 617.032, "r_x2": 480.594, "r_y2": 608.235, "r_x3": 134.765, "r_y3": 608.235, "coord_origin": "TOPLEFT"}, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.987, "r_x1": 480.591, "r_y1": 628.987, "r_x2": 480.591, "r_y2": 620.19, "r_x3": 134.765, "r_y3": 620.19, "coord_origin": "TOPLEFT"}, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.942, "r_x1": 311.198, "r_y1": 640.942, "r_x2": 311.198, "r_y2": 632.145, "r_x3": 134.765, "r_y3": 632.145, "coord_origin": "TOPLEFT"}, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 149.709, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 480.593, "r_y1": 664.855, "r_x2": 480.593, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 7, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.932651162147522, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8749732375144958, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "caption", "bbox": {"l": 134.765, "t": 123.58399999999995, "r": 480.587, "b": 156.79100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9333080053329468, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 133.72500000000002, "r_x1": 162.644, "r_y1": 133.72500000000002, "r_x2": 162.644, "r_y2": 125.79899999999998, "r_x3": 134.765, "r_y3": 125.79899999999998, "coord_origin": "TOPLEFT"}, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.276, "r_y0": 134.87300000000005, "r_x1": 480.587, "r_y1": 134.87300000000005, "r_x2": 480.587, "r_y2": 123.58399999999995, "r_x3": 166.276, "r_y3": 123.58399999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 145.832, "r_x1": 171.412, "r_y1": 145.832, "r_x2": 171.412, "r_y2": 134.543, "r_x3": 134.765, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "sentation", "orig": "sentation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.546, "r_y0": 145.832, "r_x1": 182.968, "r_y1": 145.832, "r_x2": 182.968, "r_y2": 134.543, "r_x3": 175.546, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.093, "r_y0": 145.832, "r_x1": 207.058, "r_y1": 145.832, "r_x2": 207.058, "r_y2": 134.543, "r_x3": 187.093, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.192, "r_y0": 145.832, "r_x1": 250.188, "r_y1": 145.832, "r_x2": 250.188, "r_y2": 134.543, "r_x3": 211.192, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "structure;", "orig": "structure;", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.312, "r_y0": 145.832, "r_x1": 480.587, "r_y1": 145.832, "r_x2": 480.587, "r_y2": 134.543, "r_x3": 254.312, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "C - mapping structure on a grid; D - OTSL structure", "orig": "C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 156.79100000000005, "r_x1": 306.116, "r_y1": 156.79100000000005, "r_x2": 306.116, "r_y2": 145.50199999999995, "r_x3": 134.765, "r_y3": 145.50199999999995, "coord_origin": "TOPLEFT"}, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "picture", "bbox": {"l": 164.65028381347656, "t": 163.79708862304688, "r": 449.5505676269531, "b": 280.3409423828125, "coord_origin": "TOPLEFT"}, "confidence": 0.7868534922599792, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.493, "r_y0": 177.88099999999997, "r_x1": 428.861, "r_y1": 177.22199999999998, "r_x2": 428.861, "r_y2": 168.05399999999997, "r_x3": 374.493, "r_y3": 168.71299999999997, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.769, "r_y0": 202.21299999999997, "r_x1": 448.17, "r_y1": 201.78200000000004, "r_x2": 448.17, "r_y2": 192.61400000000003, "r_x3": 373.769, "r_y3": 193.04499999999996, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.687, "r_y0": 214.42499999999995, "r_x1": 448.085, "r_y1": 214.11800000000005, "r_x2": 448.085, "r_y2": 204.95000000000005, "r_x3": 386.687, "r_y3": 205.25699999999995, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.657, "r_y0": 190.01999999999998, "r_x1": 448.147, "r_y1": 189.48800000000006, "r_x2": 448.147, "r_y2": 180.32000000000005, "r_x3": 398.657, "r_y3": 180.85199999999998, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.506, "r_y0": 226.32600000000002, "r_x1": 448.302, "r_y1": 226.52099999999996, "r_x2": 448.302, "r_y2": 217.35299999999995, "r_x3": 386.506, "r_y3": 217.15800000000002, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.16, "r_y0": 176.97699999999998, "r_x1": 447.863, "r_y1": 176.97699999999998, "r_x2": 447.863, "r_y2": 167.80899999999997, "r_x3": 435.16, "r_y3": 167.80899999999997, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.15, "r_y0": 214.52200000000005, "r_x1": 381.325, "r_y1": 214.52200000000005, "r_x2": 381.325, "r_y2": 205.35400000000004, "r_x3": 374.15, "r_y3": 205.35400000000004, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.042, "r_y0": 226.43399999999997, "r_x1": 381.217, "r_y1": 226.43399999999997, "r_x2": 381.217, "r_y2": 217.26599999999996, "r_x3": 374.042, "r_y3": 217.26599999999996, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.344, "r_y0": 190.22199999999998, "r_x1": 393.765, "r_y1": 190.07299999999998, "r_x2": 393.765, "r_y2": 180.90499999999997, "r_x3": 374.344, "r_y3": 181.05399999999997, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.259, "r_y0": 253.79600000000005, "r_x1": 301.055, "r_y1": 253.78099999999995, "r_x2": 301.055, "r_y2": 244.61300000000006, "r_x3": 282.259, "r_y3": 244.62800000000004, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.11, "r_y0": 266.13800000000003, "r_x1": 325.59, "r_y1": 265.58900000000006, "r_x2": 325.59, "r_y2": 256.42100000000005, "r_x3": 282.11, "r_y3": 256.96900000000005, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.408, "r_y0": 278.41999999999996, "r_x1": 325.478, "r_y1": 278.14200000000005, "r_x2": 325.478, "r_y2": 268.97400000000005, "r_x3": 282.408, "r_y3": 269.25199999999995, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 307.466, "r_y0": 253.861, "r_x1": 312.992, "r_y1": 253.861, "r_x2": 312.992, "r_y2": 244.69299999999998, "r_x3": 307.466, "r_y3": 244.69299999999998, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.769, "r_y0": 253.72799999999995, "r_x1": 324.294, "r_y1": 253.72799999999995, "r_x2": 324.294, "r_y2": 244.55999999999995, "r_x3": 318.769, "r_y3": 244.55999999999995, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.939, "r_y0": 278.03499999999997, "r_x1": 214.734, "r_y1": 278.02, "r_x2": 214.734, "r_y2": 268.852, "r_x3": 195.939, "r_y3": 268.86699999999996, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.146, "r_y0": 278.1, "r_x1": 226.671, "r_y1": 278.1, "r_x2": 226.671, "r_y2": 268.932, "r_x3": 221.146, "r_y3": 268.932, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.449, "r_y0": 277.967, "r_x1": 237.974, "r_y1": 277.967, "r_x2": 237.974, "r_y2": 268.799, "r_x3": 232.449, "r_y3": 268.799, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.217, "r_y0": 253.827, "r_x1": 203.392, "r_y1": 253.827, "r_x2": 203.392, "r_y2": 244.659, "r_x3": 196.217, "r_y3": 244.659, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.321, "r_y0": 253.385, "r_x1": 257.497, "r_y1": 253.385, "r_x2": 257.497, "r_y2": 244.21699999999998, "r_x3": 250.321, "r_y3": 244.21699999999998, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.172, "r_y0": 265.727, "r_x1": 257.348, "r_y1": 265.727, "r_x2": 257.348, "r_y2": 256.55899999999997, "r_x3": 250.172, "r_y3": 256.55899999999997, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.47, "r_y0": 278.01, "r_x1": 257.646, "r_y1": 278.01, "r_x2": 257.646, "r_y2": 268.842, "r_x3": 250.47, "r_y3": 268.842, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 249.18600000000004, "r_x1": 391.495, "r_y1": 249.18600000000004, "r_x2": 391.495, "r_y2": 243.07399999999996, "r_x3": 334.511, "r_y3": 243.07399999999996, "coord_origin": "TOPLEFT"}, "text": "1 - simple cells: \"C\"", "orig": "1 - simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 259.124, "r_x1": 421.986, "r_y1": 259.124, "r_x2": 421.986, "r_y2": 253.01199999999994, "r_x3": 334.511, "r_y3": 253.01199999999994, "coord_origin": "TOPLEFT"}, "text": "2 - horizontal merges: \"C\", \"L\"", "orig": "2 - horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 269.062, "r_x1": 415.344, "r_y1": 269.062, "r_x2": 415.344, "r_y2": 262.95000000000005, "r_x3": 334.511, "r_y3": 262.95000000000005, "coord_origin": "TOPLEFT"}, "text": "3 - vertical merges: \"C\", \"U\"", "orig": "3 - vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 279.0, "r_x1": 426.599, "r_y1": 279.0, "r_x2": 426.599, "r_y2": 272.88800000000003, "r_x3": 334.511, "r_y3": 272.88800000000003, "coord_origin": "TOPLEFT"}, "text": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.672, "r_y0": 250.23400000000004, "r_x1": 189.355, "r_y1": 250.23400000000004, "r_x2": 189.355, "r_y2": 244.12199999999996, "r_x3": 185.672, "r_y3": 244.12199999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.968, "r_y0": 274.539, "r_x1": 189.651, "r_y1": 274.539, "r_x2": 189.651, "r_y2": 268.427, "r_x3": 185.968, "r_y3": 268.427, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.342, "r_y0": 249.817, "r_x1": 243.025, "r_y1": 249.817, "r_x2": 243.025, "r_y2": 243.70500000000004, "r_x3": 239.342, "r_y3": 243.70500000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.329, "r_y0": 249.68499999999995, "r_x1": 275.012, "r_y1": 249.68499999999995, "r_x2": 275.012, "r_y2": 243.57299999999998, "r_x3": 271.329, "r_y3": 243.57299999999998, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.816, "r_y0": 172.707, "r_x1": 233.5, "r_y1": 172.707, "r_x2": 233.5, "r_y2": 166.59400000000005, "r_x3": 229.816, "r_y3": 166.59400000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.244, "r_y0": 196.15300000000002, "r_x1": 260.928, "r_y1": 196.15300000000002, "r_x2": 260.928, "r_y2": 190.03999999999996, "r_x3": 257.244, "r_y3": 190.03999999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.875, "r_y0": 184.168, "r_x1": 190.559, "r_y1": 184.168, "r_x2": 190.559, "r_y2": 178.05600000000004, "r_x3": 186.875, "r_y3": 178.05600000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.487, "r_y0": 175.207, "r_x1": 200.171, "r_y1": 175.207, "r_x2": 200.171, "r_y2": 169.09500000000003, "r_x3": 196.487, "r_y3": 169.09500000000003, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 175.62199999999996, "r_x1": 175.727, "r_y1": 175.62199999999996, "r_x2": 175.727, "r_y2": 167.98199999999997, "r_x3": 169.747, "r_y3": 167.98199999999997, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 214.57799999999997, "r_x1": 175.727, "r_y1": 214.57799999999997, "r_x2": 175.727, "r_y2": 206.938, "r_x3": 169.747, "r_y3": 206.938, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.294, "r_y0": 176.019, "r_x1": 280.273, "r_y1": 176.019, "r_x2": 280.273, "r_y2": 168.37900000000002, "r_x3": 274.294, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.562, "r_y0": 176.019, "r_x1": 365.541, "r_y1": 176.019, "r_x2": 365.541, "r_y2": 168.37900000000002, "r_x3": 359.562, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 250.95100000000002, "r_x1": 175.271, "r_y1": 250.95100000000002, "r_x2": 175.271, "r_y2": 243.31100000000004, "r_x3": 169.747, "r_y3": 243.31100000000004, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 38, "label": "text", "bbox": {"l": 374.493, "t": 168.05399999999997, "r": 428.861, "b": 177.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.493, "r_y0": 177.88099999999997, "r_x1": 428.861, "r_y1": 177.22199999999998, "r_x2": 428.861, "r_y2": 168.05399999999997, "r_x3": 374.493, "r_y3": 168.71299999999997, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 373.769, "t": 192.61400000000003, "r": 448.17, "b": 202.21299999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.769, "r_y0": 202.21299999999997, "r_x1": 448.17, "r_y1": 201.78200000000004, "r_x2": 448.17, "r_y2": 192.61400000000003, "r_x3": 373.769, "r_y3": 193.04499999999996, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 386.687, "t": 204.95000000000005, "r": 448.085, "b": 214.42499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.687, "r_y0": 214.42499999999995, "r_x1": 448.085, "r_y1": 214.11800000000005, "r_x2": 448.085, "r_y2": 204.95000000000005, "r_x3": 386.687, "r_y3": 205.25699999999995, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 398.657, "t": 180.32000000000005, "r": 448.147, "b": 190.01999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.657, "r_y0": 190.01999999999998, "r_x1": 448.147, "r_y1": 189.48800000000006, "r_x2": 448.147, "r_y2": 180.32000000000005, "r_x3": 398.657, "r_y3": 180.85199999999998, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 386.506, "t": 217.15800000000002, "r": 448.302, "b": 226.52099999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.506, "r_y0": 226.32600000000002, "r_x1": 448.302, "r_y1": 226.52099999999996, "r_x2": 448.302, "r_y2": 217.35299999999995, "r_x3": 386.506, "r_y3": 217.15800000000002, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 435.16, "t": 167.80899999999997, "r": 447.863, "b": 176.97699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.16, "r_y0": 176.97699999999998, "r_x1": 447.863, "r_y1": 176.97699999999998, "r_x2": 447.863, "r_y2": 167.80899999999997, "r_x3": 435.16, "r_y3": 167.80899999999997, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 374.15, "t": 205.35400000000004, "r": 381.325, "b": 214.52200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.15, "r_y0": 214.52200000000005, "r_x1": 381.325, "r_y1": 214.52200000000005, "r_x2": 381.325, "r_y2": 205.35400000000004, "r_x3": 374.15, "r_y3": 205.35400000000004, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 374.042, "t": 217.26599999999996, "r": 381.217, "b": 226.43399999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.042, "r_y0": 226.43399999999997, "r_x1": 381.217, "r_y1": 226.43399999999997, "r_x2": 381.217, "r_y2": 217.26599999999996, "r_x3": 374.042, "r_y3": 217.26599999999996, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 374.344, "t": 180.90499999999997, "r": 393.765, "b": 190.22199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.344, "r_y0": 190.22199999999998, "r_x1": 393.765, "r_y1": 190.07299999999998, "r_x2": 393.765, "r_y2": 180.90499999999997, "r_x3": 374.344, "r_y3": 181.05399999999997, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 282.259, "t": 244.61300000000006, "r": 301.055, "b": 253.79600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.259, "r_y0": 253.79600000000005, "r_x1": 301.055, "r_y1": 253.78099999999995, "r_x2": 301.055, "r_y2": 244.61300000000006, "r_x3": 282.259, "r_y3": 244.62800000000004, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 282.11, "t": 256.42100000000005, "r": 325.59, "b": 266.13800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.11, "r_y0": 266.13800000000003, "r_x1": 325.59, "r_y1": 265.58900000000006, "r_x2": 325.59, "r_y2": 256.42100000000005, "r_x3": 282.11, "r_y3": 256.96900000000005, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 282.408, "t": 268.97400000000005, "r": 325.478, "b": 278.41999999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.408, "r_y0": 278.41999999999996, "r_x1": 325.478, "r_y1": 278.14200000000005, "r_x2": 325.478, "r_y2": 268.97400000000005, "r_x3": 282.408, "r_y3": 269.25199999999995, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 307.466, "t": 244.69299999999998, "r": 312.992, "b": 253.861, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 307.466, "r_y0": 253.861, "r_x1": 312.992, "r_y1": 253.861, "r_x2": 312.992, "r_y2": 244.69299999999998, "r_x3": 307.466, "r_y3": 244.69299999999998, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 318.769, "t": 244.55999999999995, "r": 324.294, "b": 253.72799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.769, "r_y0": 253.72799999999995, "r_x1": 324.294, "r_y1": 253.72799999999995, "r_x2": 324.294, "r_y2": 244.55999999999995, "r_x3": 318.769, "r_y3": 244.55999999999995, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 195.939, "t": 268.852, "r": 214.734, "b": 278.03499999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.939, "r_y0": 278.03499999999997, "r_x1": 214.734, "r_y1": 278.02, "r_x2": 214.734, "r_y2": 268.852, "r_x3": 195.939, "r_y3": 268.86699999999996, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 221.146, "t": 268.932, "r": 226.671, "b": 278.1, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.146, "r_y0": 278.1, "r_x1": 226.671, "r_y1": 278.1, "r_x2": 226.671, "r_y2": 268.932, "r_x3": 221.146, "r_y3": 268.932, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 232.449, "t": 268.799, "r": 237.974, "b": 277.967, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.449, "r_y0": 277.967, "r_x1": 237.974, "r_y1": 277.967, "r_x2": 237.974, "r_y2": 268.799, "r_x3": 232.449, "r_y3": 268.799, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 196.217, "t": 244.659, "r": 203.392, "b": 253.827, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.217, "r_y0": 253.827, "r_x1": 203.392, "r_y1": 253.827, "r_x2": 203.392, "r_y2": 244.659, "r_x3": 196.217, "r_y3": 244.659, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 250.321, "t": 244.21699999999998, "r": 257.497, "b": 253.385, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.321, "r_y0": 253.385, "r_x1": 257.497, "r_y1": 253.385, "r_x2": 257.497, "r_y2": 244.21699999999998, "r_x3": 250.321, "r_y3": 244.21699999999998, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 250.172, "t": 256.55899999999997, "r": 257.348, "b": 265.727, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.172, "r_y0": 265.727, "r_x1": 257.348, "r_y1": 265.727, "r_x2": 257.348, "r_y2": 256.55899999999997, "r_x3": 250.172, "r_y3": 256.55899999999997, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 250.47, "t": 268.842, "r": 257.646, "b": 278.01, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.47, "r_y0": 278.01, "r_x1": 257.646, "r_y1": 278.01, "r_x2": 257.646, "r_y2": 268.842, "r_x3": 250.47, "r_y3": 268.842, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 334.511, "t": 243.07399999999996, "r": 391.495, "b": 249.18600000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 249.18600000000004, "r_x1": 391.495, "r_y1": 249.18600000000004, "r_x2": 391.495, "r_y2": 243.07399999999996, "r_x3": 334.511, "r_y3": 243.07399999999996, "coord_origin": "TOPLEFT"}, "text": "1 - simple cells: \"C\"", "orig": "1 - simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 334.511, "t": 253.01199999999994, "r": 421.986, "b": 259.124, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 259.124, "r_x1": 421.986, "r_y1": 259.124, "r_x2": 421.986, "r_y2": 253.01199999999994, "r_x3": 334.511, "r_y3": 253.01199999999994, "coord_origin": "TOPLEFT"}, "text": "2 - horizontal merges: \"C\", \"L\"", "orig": "2 - horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 334.511, "t": 262.95000000000005, "r": 415.344, "b": 269.062, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 269.062, "r_x1": 415.344, "r_y1": 269.062, "r_x2": 415.344, "r_y2": 262.95000000000005, "r_x3": 334.511, "r_y3": 262.95000000000005, "coord_origin": "TOPLEFT"}, "text": "3 - vertical merges: \"C\", \"U\"", "orig": "3 - vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "list_item", "bbox": {"l": 334.511, "t": 272.88800000000003, "r": 426.599, "b": 279.0, "coord_origin": "TOPLEFT"}, "confidence": 0.5250625610351562, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 279.0, "r_x1": 426.599, "r_y1": 279.0, "r_x2": 426.599, "r_y2": 272.88800000000003, "r_x3": 334.511, "r_y3": 272.88800000000003, "coord_origin": "TOPLEFT"}, "text": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 185.672, "t": 244.12199999999996, "r": 189.355, "b": 250.23400000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.672, "r_y0": 250.23400000000004, "r_x1": 189.355, "r_y1": 250.23400000000004, "r_x2": 189.355, "r_y2": 244.12199999999996, "r_x3": 185.672, "r_y3": 244.12199999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 185.968, "t": 268.427, "r": 189.651, "b": 274.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.968, "r_y0": 274.539, "r_x1": 189.651, "r_y1": 274.539, "r_x2": 189.651, "r_y2": 268.427, "r_x3": 185.968, "r_y3": 268.427, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 239.342, "t": 243.70500000000004, "r": 243.025, "b": 249.817, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.342, "r_y0": 249.817, "r_x1": 243.025, "r_y1": 249.817, "r_x2": 243.025, "r_y2": 243.70500000000004, "r_x3": 239.342, "r_y3": 243.70500000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 271.329, "t": 243.57299999999998, "r": 275.012, "b": 249.68499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.329, "r_y0": 249.68499999999995, "r_x1": 275.012, "r_y1": 249.68499999999995, "r_x2": 275.012, "r_y2": 243.57299999999998, "r_x3": 271.329, "r_y3": 243.57299999999998, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 229.816, "t": 166.59400000000005, "r": 233.5, "b": 172.707, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.816, "r_y0": 172.707, "r_x1": 233.5, "r_y1": 172.707, "r_x2": 233.5, "r_y2": 166.59400000000005, "r_x3": 229.816, "r_y3": 166.59400000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 257.244, "t": 190.03999999999996, "r": 260.928, "b": 196.15300000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.244, "r_y0": 196.15300000000002, "r_x1": 260.928, "r_y1": 196.15300000000002, "r_x2": 260.928, "r_y2": 190.03999999999996, "r_x3": 257.244, "r_y3": 190.03999999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 186.875, "t": 178.05600000000004, "r": 190.559, "b": 184.168, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.875, "r_y0": 184.168, "r_x1": 190.559, "r_y1": 184.168, "r_x2": 190.559, "r_y2": 178.05600000000004, "r_x3": 186.875, "r_y3": 178.05600000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 196.487, "t": 169.09500000000003, "r": 200.171, "b": 175.207, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.487, "r_y0": 175.207, "r_x1": 200.171, "r_y1": 175.207, "r_x2": 200.171, "r_y2": 169.09500000000003, "r_x3": 196.487, "r_y3": 169.09500000000003, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 169.747, "t": 167.98199999999997, "r": 175.727, "b": 175.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 175.62199999999996, "r_x1": 175.727, "r_y1": 175.62199999999996, "r_x2": 175.727, "r_y2": 167.98199999999997, "r_x3": 169.747, "r_y3": 167.98199999999997, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 169.747, "t": 206.938, "r": 175.727, "b": 214.57799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 214.57799999999997, "r_x1": 175.727, "r_y1": 214.57799999999997, "r_x2": 175.727, "r_y2": 206.938, "r_x3": 169.747, "r_y3": 206.938, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 274.294, "t": 168.37900000000002, "r": 280.273, "b": 176.019, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.294, "r_y0": 176.019, "r_x1": 280.273, "r_y1": 176.019, "r_x2": 280.273, "r_y2": 168.37900000000002, "r_x3": 274.294, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 359.562, "t": 168.37900000000002, "r": 365.541, "b": 176.019, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.562, "r_y0": 176.019, "r_x1": 365.541, "r_y1": 176.019, "r_x2": 365.541, "r_y2": 168.37900000000002, "r_x3": 359.562, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 169.747, "t": 243.31100000000004, "r": 175.271, "b": 250.95100000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 250.95100000000002, "r_x1": 175.271, "r_y1": 250.95100000000002, "r_x2": 175.271, "r_y2": 243.31100000000004, "r_x3": 169.747, "r_y3": 243.31100000000004, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 9, "label": "section_header", "bbox": {"l": 134.765, "t": 305.296, "r": 246.652, "b": 314.103, "coord_origin": "TOPLEFT"}, "confidence": 0.9233023524284363, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 314.103, "r_x1": 149.402, "r_y1": 314.103, "r_x2": 149.402, "r_y2": 305.296, "r_x3": 134.765, "r_y3": 305.296, "coord_origin": "TOPLEFT"}, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 314.103, "r_x1": 246.652, "r_y1": 314.103, "r_x2": 246.652, "r_y2": 305.296, "r_x3": 160.859, "r_y3": 305.296, "coord_origin": "TOPLEFT"}, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "text", "bbox": {"l": 134.765, "t": 325.248, "r": 363.796, "b": 334.045, "coord_origin": "TOPLEFT"}, "confidence": 0.9169168472290039, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 334.045, "r_x1": 363.796, "r_y1": 334.045, "r_x2": 363.796, "r_y2": 325.248, "r_x3": 134.765, "r_y3": 325.248, "coord_origin": "TOPLEFT"}, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 138.973, "t": 347.171, "r": 480.589, "b": 367.934, "coord_origin": "TOPLEFT"}, "confidence": 0.9588112235069275, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 355.978, "r_x1": 146.72, "r_y1": 355.978, "r_x2": 146.72, "r_y2": 347.181, "r_x3": 138.973, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 355.978, "r_x1": 257.379, "r_y1": 355.978, "r_x2": 257.379, "r_y2": 347.171, "r_x3": 151.701, "r_y3": 347.171, "coord_origin": "TOPLEFT"}, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.383, "r_y0": 355.978, "r_x1": 260.15, "r_y1": 355.978, "r_x2": 260.15, "r_y2": 347.181, "r_x3": 257.383, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.184, "r_y0": 355.978, "r_x1": 480.589, "r_y1": 355.978, "r_x2": 480.589, "r_y2": 347.181, "r_x3": 264.184, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": "The left neighbour of an \"L\" cell must be either", "orig": "The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 367.934, "r_x1": 283.594, "r_y1": 367.934, "r_x2": 283.594, "r_y2": 359.137, "r_x3": 151.701, "r_y3": 359.137, "coord_origin": "TOPLEFT"}, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 138.973, "t": 371.085, "r": 480.592, "b": 391.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9585386514663696, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 379.892, "r_x1": 146.72, "r_y1": 379.892, "r_x2": 146.72, "r_y2": 371.095, "r_x3": 138.973, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 379.892, "r_x1": 252.112, "r_y1": 379.892, "r_x2": 252.112, "r_y2": 371.085, "r_x3": 151.701, "r_y3": 371.085, "coord_origin": "TOPLEFT"}, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.112, "r_y0": 379.892, "r_x1": 254.879, "r_y1": 379.892, "r_x2": 254.879, "r_y2": 371.095, "r_x3": 252.112, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.764, "r_y0": 379.892, "r_x1": 480.592, "r_y1": 379.892, "r_x2": 480.592, "r_y2": 371.095, "r_x3": 258.764, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": "The upper neighbour of a \"U\" cell must be either", "orig": "The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 391.847, "r_x1": 284.839, "r_y1": 391.847, "r_x2": 284.839, "r_y2": 383.05, "r_x3": 151.701, "r_y3": 383.05, "coord_origin": "TOPLEFT"}, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "section_header", "bbox": {"l": 138.973, "t": 394.998, "r": 226.074, "b": 403.805, "coord_origin": "TOPLEFT"}, "confidence": 0.6506174206733704, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 403.805, "r_x1": 146.72, "r_y1": 403.805, "r_x2": 146.72, "r_y2": 395.008, "r_x3": 138.973, "r_y3": 395.008, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 403.805, "r_x1": 223.304, "r_y1": 403.805, "r_x2": 223.304, "r_y2": 394.998, "r_x3": 151.701, "r_y3": 394.998, "coord_origin": "TOPLEFT"}, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 223.307, "r_y0": 403.805, "r_x1": 226.074, "r_y1": 403.805, "r_x2": 226.074, "r_y2": 395.008, "r_x3": 223.307, "r_y3": 395.008, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "list_item", "bbox": {"l": 151.701, "t": 406.967, "r": 480.592, "b": 439.674, "coord_origin": "TOPLEFT"}, "confidence": 0.7247239947319031, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 415.764, "r_x1": 480.592, "r_y1": 415.764, "r_x2": 480.592, "r_y2": 406.967, "r_x3": 151.701, "r_y3": 406.967, "coord_origin": "TOPLEFT"}, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 427.719, "r_x1": 480.592, "r_y1": 427.719, "r_x2": 480.592, "r_y2": 418.922, "r_x3": 151.701, "r_y3": 418.922, "coord_origin": "TOPLEFT"}, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 439.674, "r_x1": 214.397, "r_y1": 439.674, "r_x2": 214.397, "r_y2": 430.877, "r_x3": 151.701, "r_y3": 430.877, "coord_origin": "TOPLEFT"}, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 138.973, "t": 442.826, "r": 474.59, "b": 451.633, "coord_origin": "TOPLEFT"}, "confidence": 0.9259927272796631, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 451.633, "r_x1": 146.72, "r_y1": 451.633, "r_x2": 146.72, "r_y2": 442.836, "r_x3": 138.973, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 451.633, "r_x1": 221.323, "r_y1": 451.633, "r_x2": 221.323, "r_y2": 442.826, "r_x3": 151.701, "r_y3": 442.826, "coord_origin": "TOPLEFT"}, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.327, "r_y0": 451.633, "r_x1": 224.094, "r_y1": 451.633, "r_x2": 224.094, "r_y2": 442.836, "r_x3": 221.327, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.411, "r_y0": 451.633, "r_x1": 474.59, "r_y1": 451.633, "r_x2": 474.59, "r_y2": 442.836, "r_x3": 227.411, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": "Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": "Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 138.973, "t": 454.784, "r": 480.588, "b": 475.546, "coord_origin": "TOPLEFT"}, "confidence": 0.9420599937438965, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 463.591, "r_x1": 146.72, "r_y1": 463.591, "r_x2": 146.72, "r_y2": 454.794, "r_x3": 138.973, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 463.591, "r_x1": 240.72, "r_y1": 463.591, "r_x2": 240.72, "r_y2": 454.784, "r_x3": 151.701, "r_y3": 454.784, "coord_origin": "TOPLEFT"}, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.716, "r_y0": 463.591, "r_x1": 243.483, "r_y1": 463.591, "r_x2": 243.483, "r_y2": 454.794, "r_x3": 240.716, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.458, "r_y0": 463.591, "r_x1": 480.588, "r_y1": 463.591, "r_x2": 480.588, "r_y2": 454.794, "r_x3": 247.458, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": "Only \"U\" cells and \"C\" cells are allowed in the first", "orig": "Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 475.546, "r_x1": 186.007, "r_y1": 475.546, "r_x2": 186.007, "r_y2": 466.749, "r_x3": 151.701, "r_y3": 466.749, "coord_origin": "TOPLEFT"}, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "list_item", "bbox": {"l": 138.973, "t": 478.697, "r": 480.595, "b": 499.46, "coord_origin": "TOPLEFT"}, "confidence": 0.9617829918861389, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 487.504, "r_x1": 146.72, "r_y1": 487.504, "r_x2": 146.72, "r_y2": 478.707, "r_x3": 138.973, "r_y3": 478.707, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 487.504, "r_x1": 235.158, "r_y1": 487.504, "r_x2": 235.158, "r_y2": 478.697, "r_x3": 151.701, "r_y3": 478.697, "coord_origin": "TOPLEFT"}, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.157, "r_y0": 487.504, "r_x1": 480.595, "r_y1": 487.504, "r_x2": 480.595, "r_y2": 478.707, "r_x3": 235.157, "r_y3": 478.707, "coord_origin": "TOPLEFT"}, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 499.46, "r_x1": 448.042, "r_y1": 499.46, "r_x2": 448.042, "r_y2": 490.663, "r_x3": 151.701, "r_y3": 490.663, "coord_origin": "TOPLEFT"}, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 512.5930000000001, "r": 480.596, "b": 640.942, "coord_origin": "TOPLEFT"}, "confidence": 0.9785562753677368, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 521.39, "r_x1": 480.596, "r_y1": 521.39, "r_x2": 480.596, "r_y2": 512.5930000000001, "r_x3": 149.709, "r_y3": 512.5930000000001, "coord_origin": "TOPLEFT"}, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.345, "r_x1": 480.591, "r_y1": 533.345, "r_x2": 480.591, "r_y2": 524.548, "r_x3": 134.765, "r_y3": 524.548, "coord_origin": "TOPLEFT"}, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.3, "r_x1": 480.595, "r_y1": 545.3, "r_x2": 480.595, "r_y2": 536.5029999999999, "r_x3": 134.765, "r_y3": 536.5029999999999, "coord_origin": "TOPLEFT"}, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.256, "r_x1": 480.589, "r_y1": 557.256, "r_x2": 480.589, "r_y2": 548.4590000000001, "r_x3": 134.765, "r_y3": 548.4590000000001, "coord_origin": "TOPLEFT"}, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.211, "r_x1": 480.594, "r_y1": 569.211, "r_x2": 480.594, "r_y2": 560.414, "r_x3": 134.765, "r_y3": 560.414, "coord_origin": "TOPLEFT"}, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.1659999999999, "r_x1": 480.587, "r_y1": 581.1659999999999, "r_x2": 480.587, "r_y2": 572.369, "r_x3": 134.765, "r_y3": 572.369, "coord_origin": "TOPLEFT"}, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.121, "r_x1": 480.592, "r_y1": 593.121, "r_x2": 480.592, "r_y2": 584.3240000000001, "r_x3": 134.765, "r_y3": 584.3240000000001, "coord_origin": "TOPLEFT"}, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.076, "r_x1": 480.592, "r_y1": 605.076, "r_x2": 480.592, "r_y2": 596.279, "r_x3": 134.765, "r_y3": 596.279, "coord_origin": "TOPLEFT"}, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.032, "r_x1": 480.594, "r_y1": 617.032, "r_x2": 480.594, "r_y2": 608.235, "r_x3": 134.765, "r_y3": 608.235, "coord_origin": "TOPLEFT"}, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.987, "r_x1": 480.591, "r_y1": 628.987, "r_x2": 480.591, "r_y2": 620.19, "r_x3": 134.765, "r_y3": 620.19, "coord_origin": "TOPLEFT"}, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.942, "r_x1": 311.198, "r_y1": 640.942, "r_x2": 311.198, "r_y2": 632.145, "r_x3": 134.765, "r_y3": 632.145, "coord_origin": "TOPLEFT"}, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 644.1030000000001, "r": 480.593, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9590610861778259, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 149.709, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 480.593, "r_y1": 664.855, "r_x2": 480.593, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 7, "page_no": 6, "cluster": {"id": 7, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.932651162147522, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 11, "page_no": 6, "cluster": {"id": 11, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8749732375144958, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7"}, {"label": "caption", "id": 6, "page_no": 6, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 134.765, "t": 123.58399999999995, "r": 480.587, "b": 156.79100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9333080053329468, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 133.72500000000002, "r_x1": 162.644, "r_y1": 133.72500000000002, "r_x2": 162.644, "r_y2": 125.79899999999998, "r_x3": 134.765, "r_y3": 125.79899999999998, "coord_origin": "TOPLEFT"}, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.276, "r_y0": 134.87300000000005, "r_x1": 480.587, "r_y1": 134.87300000000005, "r_x2": 480.587, "r_y2": 123.58399999999995, "r_x3": 166.276, "r_y3": 123.58399999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 145.832, "r_x1": 171.412, "r_y1": 145.832, "r_x2": 171.412, "r_y2": 134.543, "r_x3": 134.765, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "sentation", "orig": "sentation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.546, "r_y0": 145.832, "r_x1": 182.968, "r_y1": 145.832, "r_x2": 182.968, "r_y2": 134.543, "r_x3": 175.546, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.093, "r_y0": 145.832, "r_x1": 207.058, "r_y1": 145.832, "r_x2": 207.058, "r_y2": 134.543, "r_x3": 187.093, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.192, "r_y0": 145.832, "r_x1": 250.188, "r_y1": 145.832, "r_x2": 250.188, "r_y2": 134.543, "r_x3": 211.192, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "structure;", "orig": "structure;", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.312, "r_y0": 145.832, "r_x1": 480.587, "r_y1": 145.832, "r_x2": 480.587, "r_y2": 134.543, "r_x3": 254.312, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "C - mapping structure on a grid; D - OTSL structure", "orig": "C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 156.79100000000005, "r_x1": 306.116, "r_y1": 156.79100000000005, "r_x2": 306.116, "r_y2": 145.50199999999995, "r_x3": 134.765, "r_y3": 145.50199999999995, "coord_origin": "TOPLEFT"}, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 3. OTSL description of table structure: A - table example; B - graphical representation of table structure; C - mapping structure on a grid; D - OTSL structure encoding; E - explanation on cell encoding"}, {"label": "picture", "id": 12, "page_no": 6, "cluster": {"id": 12, "label": "picture", "bbox": {"l": 164.65028381347656, "t": 163.79708862304688, "r": 449.5505676269531, "b": 280.3409423828125, "coord_origin": "TOPLEFT"}, "confidence": 0.7868534922599792, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.493, "r_y0": 177.88099999999997, "r_x1": 428.861, "r_y1": 177.22199999999998, "r_x2": 428.861, "r_y2": 168.05399999999997, "r_x3": 374.493, "r_y3": 168.71299999999997, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.769, "r_y0": 202.21299999999997, "r_x1": 448.17, "r_y1": 201.78200000000004, "r_x2": 448.17, "r_y2": 192.61400000000003, "r_x3": 373.769, "r_y3": 193.04499999999996, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.687, "r_y0": 214.42499999999995, "r_x1": 448.085, "r_y1": 214.11800000000005, "r_x2": 448.085, "r_y2": 204.95000000000005, "r_x3": 386.687, "r_y3": 205.25699999999995, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.657, "r_y0": 190.01999999999998, "r_x1": 448.147, "r_y1": 189.48800000000006, "r_x2": 448.147, "r_y2": 180.32000000000005, "r_x3": 398.657, "r_y3": 180.85199999999998, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.506, "r_y0": 226.32600000000002, "r_x1": 448.302, "r_y1": 226.52099999999996, "r_x2": 448.302, "r_y2": 217.35299999999995, "r_x3": 386.506, "r_y3": 217.15800000000002, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.16, "r_y0": 176.97699999999998, "r_x1": 447.863, "r_y1": 176.97699999999998, "r_x2": 447.863, "r_y2": 167.80899999999997, "r_x3": 435.16, "r_y3": 167.80899999999997, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.15, "r_y0": 214.52200000000005, "r_x1": 381.325, "r_y1": 214.52200000000005, "r_x2": 381.325, "r_y2": 205.35400000000004, "r_x3": 374.15, "r_y3": 205.35400000000004, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.042, "r_y0": 226.43399999999997, "r_x1": 381.217, "r_y1": 226.43399999999997, "r_x2": 381.217, "r_y2": 217.26599999999996, "r_x3": 374.042, "r_y3": 217.26599999999996, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.344, "r_y0": 190.22199999999998, "r_x1": 393.765, "r_y1": 190.07299999999998, "r_x2": 393.765, "r_y2": 180.90499999999997, "r_x3": 374.344, "r_y3": 181.05399999999997, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.259, "r_y0": 253.79600000000005, "r_x1": 301.055, "r_y1": 253.78099999999995, "r_x2": 301.055, "r_y2": 244.61300000000006, "r_x3": 282.259, "r_y3": 244.62800000000004, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.11, "r_y0": 266.13800000000003, "r_x1": 325.59, "r_y1": 265.58900000000006, "r_x2": 325.59, "r_y2": 256.42100000000005, "r_x3": 282.11, "r_y3": 256.96900000000005, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.408, "r_y0": 278.41999999999996, "r_x1": 325.478, "r_y1": 278.14200000000005, "r_x2": 325.478, "r_y2": 268.97400000000005, "r_x3": 282.408, "r_y3": 269.25199999999995, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 307.466, "r_y0": 253.861, "r_x1": 312.992, "r_y1": 253.861, "r_x2": 312.992, "r_y2": 244.69299999999998, "r_x3": 307.466, "r_y3": 244.69299999999998, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.769, "r_y0": 253.72799999999995, "r_x1": 324.294, "r_y1": 253.72799999999995, "r_x2": 324.294, "r_y2": 244.55999999999995, "r_x3": 318.769, "r_y3": 244.55999999999995, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.939, "r_y0": 278.03499999999997, "r_x1": 214.734, "r_y1": 278.02, "r_x2": 214.734, "r_y2": 268.852, "r_x3": 195.939, "r_y3": 268.86699999999996, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.146, "r_y0": 278.1, "r_x1": 226.671, "r_y1": 278.1, "r_x2": 226.671, "r_y2": 268.932, "r_x3": 221.146, "r_y3": 268.932, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.449, "r_y0": 277.967, "r_x1": 237.974, "r_y1": 277.967, "r_x2": 237.974, "r_y2": 268.799, "r_x3": 232.449, "r_y3": 268.799, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.217, "r_y0": 253.827, "r_x1": 203.392, "r_y1": 253.827, "r_x2": 203.392, "r_y2": 244.659, "r_x3": 196.217, "r_y3": 244.659, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.321, "r_y0": 253.385, "r_x1": 257.497, "r_y1": 253.385, "r_x2": 257.497, "r_y2": 244.21699999999998, "r_x3": 250.321, "r_y3": 244.21699999999998, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.172, "r_y0": 265.727, "r_x1": 257.348, "r_y1": 265.727, "r_x2": 257.348, "r_y2": 256.55899999999997, "r_x3": 250.172, "r_y3": 256.55899999999997, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.47, "r_y0": 278.01, "r_x1": 257.646, "r_y1": 278.01, "r_x2": 257.646, "r_y2": 268.842, "r_x3": 250.47, "r_y3": 268.842, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 249.18600000000004, "r_x1": 391.495, "r_y1": 249.18600000000004, "r_x2": 391.495, "r_y2": 243.07399999999996, "r_x3": 334.511, "r_y3": 243.07399999999996, "coord_origin": "TOPLEFT"}, "text": "1 - simple cells: \"C\"", "orig": "1 - simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 259.124, "r_x1": 421.986, "r_y1": 259.124, "r_x2": 421.986, "r_y2": 253.01199999999994, "r_x3": 334.511, "r_y3": 253.01199999999994, "coord_origin": "TOPLEFT"}, "text": "2 - horizontal merges: \"C\", \"L\"", "orig": "2 - horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 269.062, "r_x1": 415.344, "r_y1": 269.062, "r_x2": 415.344, "r_y2": 262.95000000000005, "r_x3": 334.511, "r_y3": 262.95000000000005, "coord_origin": "TOPLEFT"}, "text": "3 - vertical merges: \"C\", \"U\"", "orig": "3 - vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 279.0, "r_x1": 426.599, "r_y1": 279.0, "r_x2": 426.599, "r_y2": 272.88800000000003, "r_x3": 334.511, "r_y3": 272.88800000000003, "coord_origin": "TOPLEFT"}, "text": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.672, "r_y0": 250.23400000000004, "r_x1": 189.355, "r_y1": 250.23400000000004, "r_x2": 189.355, "r_y2": 244.12199999999996, "r_x3": 185.672, "r_y3": 244.12199999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.968, "r_y0": 274.539, "r_x1": 189.651, "r_y1": 274.539, "r_x2": 189.651, "r_y2": 268.427, "r_x3": 185.968, "r_y3": 268.427, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.342, "r_y0": 249.817, "r_x1": 243.025, "r_y1": 249.817, "r_x2": 243.025, "r_y2": 243.70500000000004, "r_x3": 239.342, "r_y3": 243.70500000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.329, "r_y0": 249.68499999999995, "r_x1": 275.012, "r_y1": 249.68499999999995, "r_x2": 275.012, "r_y2": 243.57299999999998, "r_x3": 271.329, "r_y3": 243.57299999999998, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.816, "r_y0": 172.707, "r_x1": 233.5, "r_y1": 172.707, "r_x2": 233.5, "r_y2": 166.59400000000005, "r_x3": 229.816, "r_y3": 166.59400000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.244, "r_y0": 196.15300000000002, "r_x1": 260.928, "r_y1": 196.15300000000002, "r_x2": 260.928, "r_y2": 190.03999999999996, "r_x3": 257.244, "r_y3": 190.03999999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.875, "r_y0": 184.168, "r_x1": 190.559, "r_y1": 184.168, "r_x2": 190.559, "r_y2": 178.05600000000004, "r_x3": 186.875, "r_y3": 178.05600000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.487, "r_y0": 175.207, "r_x1": 200.171, "r_y1": 175.207, "r_x2": 200.171, "r_y2": 169.09500000000003, "r_x3": 196.487, "r_y3": 169.09500000000003, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 175.62199999999996, "r_x1": 175.727, "r_y1": 175.62199999999996, "r_x2": 175.727, "r_y2": 167.98199999999997, "r_x3": 169.747, "r_y3": 167.98199999999997, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 214.57799999999997, "r_x1": 175.727, "r_y1": 214.57799999999997, "r_x2": 175.727, "r_y2": 206.938, "r_x3": 169.747, "r_y3": 206.938, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.294, "r_y0": 176.019, "r_x1": 280.273, "r_y1": 176.019, "r_x2": 280.273, "r_y2": 168.37900000000002, "r_x3": 274.294, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.562, "r_y0": 176.019, "r_x1": 365.541, "r_y1": 176.019, "r_x2": 365.541, "r_y2": 168.37900000000002, "r_x3": 359.562, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 250.95100000000002, "r_x1": 175.271, "r_y1": 250.95100000000002, "r_x2": 175.271, "r_y2": 243.31100000000004, "r_x3": 169.747, "r_y3": 243.31100000000004, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 38, "label": "text", "bbox": {"l": 374.493, "t": 168.05399999999997, "r": 428.861, "b": 177.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.493, "r_y0": 177.88099999999997, "r_x1": 428.861, "r_y1": 177.22199999999998, "r_x2": 428.861, "r_y2": 168.05399999999997, "r_x3": 374.493, "r_y3": 168.71299999999997, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 373.769, "t": 192.61400000000003, "r": 448.17, "b": 202.21299999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.769, "r_y0": 202.21299999999997, "r_x1": 448.17, "r_y1": 201.78200000000004, "r_x2": 448.17, "r_y2": 192.61400000000003, "r_x3": 373.769, "r_y3": 193.04499999999996, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 386.687, "t": 204.95000000000005, "r": 448.085, "b": 214.42499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.687, "r_y0": 214.42499999999995, "r_x1": 448.085, "r_y1": 214.11800000000005, "r_x2": 448.085, "r_y2": 204.95000000000005, "r_x3": 386.687, "r_y3": 205.25699999999995, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 398.657, "t": 180.32000000000005, "r": 448.147, "b": 190.01999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.657, "r_y0": 190.01999999999998, "r_x1": 448.147, "r_y1": 189.48800000000006, "r_x2": 448.147, "r_y2": 180.32000000000005, "r_x3": 398.657, "r_y3": 180.85199999999998, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 386.506, "t": 217.15800000000002, "r": 448.302, "b": 226.52099999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.506, "r_y0": 226.32600000000002, "r_x1": 448.302, "r_y1": 226.52099999999996, "r_x2": 448.302, "r_y2": 217.35299999999995, "r_x3": 386.506, "r_y3": 217.15800000000002, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 435.16, "t": 167.80899999999997, "r": 447.863, "b": 176.97699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.16, "r_y0": 176.97699999999998, "r_x1": 447.863, "r_y1": 176.97699999999998, "r_x2": 447.863, "r_y2": 167.80899999999997, "r_x3": 435.16, "r_y3": 167.80899999999997, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 374.15, "t": 205.35400000000004, "r": 381.325, "b": 214.52200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.15, "r_y0": 214.52200000000005, "r_x1": 381.325, "r_y1": 214.52200000000005, "r_x2": 381.325, "r_y2": 205.35400000000004, "r_x3": 374.15, "r_y3": 205.35400000000004, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 374.042, "t": 217.26599999999996, "r": 381.217, "b": 226.43399999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.042, "r_y0": 226.43399999999997, "r_x1": 381.217, "r_y1": 226.43399999999997, "r_x2": 381.217, "r_y2": 217.26599999999996, "r_x3": 374.042, "r_y3": 217.26599999999996, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 374.344, "t": 180.90499999999997, "r": 393.765, "b": 190.22199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.344, "r_y0": 190.22199999999998, "r_x1": 393.765, "r_y1": 190.07299999999998, "r_x2": 393.765, "r_y2": 180.90499999999997, "r_x3": 374.344, "r_y3": 181.05399999999997, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 282.259, "t": 244.61300000000006, "r": 301.055, "b": 253.79600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.259, "r_y0": 253.79600000000005, "r_x1": 301.055, "r_y1": 253.78099999999995, "r_x2": 301.055, "r_y2": 244.61300000000006, "r_x3": 282.259, "r_y3": 244.62800000000004, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 282.11, "t": 256.42100000000005, "r": 325.59, "b": 266.13800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.11, "r_y0": 266.13800000000003, "r_x1": 325.59, "r_y1": 265.58900000000006, "r_x2": 325.59, "r_y2": 256.42100000000005, "r_x3": 282.11, "r_y3": 256.96900000000005, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 282.408, "t": 268.97400000000005, "r": 325.478, "b": 278.41999999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.408, "r_y0": 278.41999999999996, "r_x1": 325.478, "r_y1": 278.14200000000005, "r_x2": 325.478, "r_y2": 268.97400000000005, "r_x3": 282.408, "r_y3": 269.25199999999995, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 307.466, "t": 244.69299999999998, "r": 312.992, "b": 253.861, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 307.466, "r_y0": 253.861, "r_x1": 312.992, "r_y1": 253.861, "r_x2": 312.992, "r_y2": 244.69299999999998, "r_x3": 307.466, "r_y3": 244.69299999999998, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 318.769, "t": 244.55999999999995, "r": 324.294, "b": 253.72799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.769, "r_y0": 253.72799999999995, "r_x1": 324.294, "r_y1": 253.72799999999995, "r_x2": 324.294, "r_y2": 244.55999999999995, "r_x3": 318.769, "r_y3": 244.55999999999995, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 195.939, "t": 268.852, "r": 214.734, "b": 278.03499999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.939, "r_y0": 278.03499999999997, "r_x1": 214.734, "r_y1": 278.02, "r_x2": 214.734, "r_y2": 268.852, "r_x3": 195.939, "r_y3": 268.86699999999996, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 221.146, "t": 268.932, "r": 226.671, "b": 278.1, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.146, "r_y0": 278.1, "r_x1": 226.671, "r_y1": 278.1, "r_x2": 226.671, "r_y2": 268.932, "r_x3": 221.146, "r_y3": 268.932, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 232.449, "t": 268.799, "r": 237.974, "b": 277.967, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.449, "r_y0": 277.967, "r_x1": 237.974, "r_y1": 277.967, "r_x2": 237.974, "r_y2": 268.799, "r_x3": 232.449, "r_y3": 268.799, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 196.217, "t": 244.659, "r": 203.392, "b": 253.827, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.217, "r_y0": 253.827, "r_x1": 203.392, "r_y1": 253.827, "r_x2": 203.392, "r_y2": 244.659, "r_x3": 196.217, "r_y3": 244.659, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 250.321, "t": 244.21699999999998, "r": 257.497, "b": 253.385, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.321, "r_y0": 253.385, "r_x1": 257.497, "r_y1": 253.385, "r_x2": 257.497, "r_y2": 244.21699999999998, "r_x3": 250.321, "r_y3": 244.21699999999998, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 250.172, "t": 256.55899999999997, "r": 257.348, "b": 265.727, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.172, "r_y0": 265.727, "r_x1": 257.348, "r_y1": 265.727, "r_x2": 257.348, "r_y2": 256.55899999999997, "r_x3": 250.172, "r_y3": 256.55899999999997, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 250.47, "t": 268.842, "r": 257.646, "b": 278.01, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.47, "r_y0": 278.01, "r_x1": 257.646, "r_y1": 278.01, "r_x2": 257.646, "r_y2": 268.842, "r_x3": 250.47, "r_y3": 268.842, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 334.511, "t": 243.07399999999996, "r": 391.495, "b": 249.18600000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 249.18600000000004, "r_x1": 391.495, "r_y1": 249.18600000000004, "r_x2": 391.495, "r_y2": 243.07399999999996, "r_x3": 334.511, "r_y3": 243.07399999999996, "coord_origin": "TOPLEFT"}, "text": "1 - simple cells: \"C\"", "orig": "1 - simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 334.511, "t": 253.01199999999994, "r": 421.986, "b": 259.124, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 259.124, "r_x1": 421.986, "r_y1": 259.124, "r_x2": 421.986, "r_y2": 253.01199999999994, "r_x3": 334.511, "r_y3": 253.01199999999994, "coord_origin": "TOPLEFT"}, "text": "2 - horizontal merges: \"C\", \"L\"", "orig": "2 - horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 334.511, "t": 262.95000000000005, "r": 415.344, "b": 269.062, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 269.062, "r_x1": 415.344, "r_y1": 269.062, "r_x2": 415.344, "r_y2": 262.95000000000005, "r_x3": 334.511, "r_y3": 262.95000000000005, "coord_origin": "TOPLEFT"}, "text": "3 - vertical merges: \"C\", \"U\"", "orig": "3 - vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "list_item", "bbox": {"l": 334.511, "t": 272.88800000000003, "r": 426.599, "b": 279.0, "coord_origin": "TOPLEFT"}, "confidence": 0.5250625610351562, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 279.0, "r_x1": 426.599, "r_y1": 279.0, "r_x2": 426.599, "r_y2": 272.88800000000003, "r_x3": 334.511, "r_y3": 272.88800000000003, "coord_origin": "TOPLEFT"}, "text": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 185.672, "t": 244.12199999999996, "r": 189.355, "b": 250.23400000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.672, "r_y0": 250.23400000000004, "r_x1": 189.355, "r_y1": 250.23400000000004, "r_x2": 189.355, "r_y2": 244.12199999999996, "r_x3": 185.672, "r_y3": 244.12199999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 185.968, "t": 268.427, "r": 189.651, "b": 274.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.968, "r_y0": 274.539, "r_x1": 189.651, "r_y1": 274.539, "r_x2": 189.651, "r_y2": 268.427, "r_x3": 185.968, "r_y3": 268.427, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 239.342, "t": 243.70500000000004, "r": 243.025, "b": 249.817, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.342, "r_y0": 249.817, "r_x1": 243.025, "r_y1": 249.817, "r_x2": 243.025, "r_y2": 243.70500000000004, "r_x3": 239.342, "r_y3": 243.70500000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 271.329, "t": 243.57299999999998, "r": 275.012, "b": 249.68499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.329, "r_y0": 249.68499999999995, "r_x1": 275.012, "r_y1": 249.68499999999995, "r_x2": 275.012, "r_y2": 243.57299999999998, "r_x3": 271.329, "r_y3": 243.57299999999998, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 229.816, "t": 166.59400000000005, "r": 233.5, "b": 172.707, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.816, "r_y0": 172.707, "r_x1": 233.5, "r_y1": 172.707, "r_x2": 233.5, "r_y2": 166.59400000000005, "r_x3": 229.816, "r_y3": 166.59400000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 257.244, "t": 190.03999999999996, "r": 260.928, "b": 196.15300000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.244, "r_y0": 196.15300000000002, "r_x1": 260.928, "r_y1": 196.15300000000002, "r_x2": 260.928, "r_y2": 190.03999999999996, "r_x3": 257.244, "r_y3": 190.03999999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 186.875, "t": 178.05600000000004, "r": 190.559, "b": 184.168, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.875, "r_y0": 184.168, "r_x1": 190.559, "r_y1": 184.168, "r_x2": 190.559, "r_y2": 178.05600000000004, "r_x3": 186.875, "r_y3": 178.05600000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 196.487, "t": 169.09500000000003, "r": 200.171, "b": 175.207, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.487, "r_y0": 175.207, "r_x1": 200.171, "r_y1": 175.207, "r_x2": 200.171, "r_y2": 169.09500000000003, "r_x3": 196.487, "r_y3": 169.09500000000003, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 169.747, "t": 167.98199999999997, "r": 175.727, "b": 175.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 175.62199999999996, "r_x1": 175.727, "r_y1": 175.62199999999996, "r_x2": 175.727, "r_y2": 167.98199999999997, "r_x3": 169.747, "r_y3": 167.98199999999997, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 169.747, "t": 206.938, "r": 175.727, "b": 214.57799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 214.57799999999997, "r_x1": 175.727, "r_y1": 214.57799999999997, "r_x2": 175.727, "r_y2": 206.938, "r_x3": 169.747, "r_y3": 206.938, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 274.294, "t": 168.37900000000002, "r": 280.273, "b": 176.019, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.294, "r_y0": 176.019, "r_x1": 280.273, "r_y1": 176.019, "r_x2": 280.273, "r_y2": 168.37900000000002, "r_x3": 274.294, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 359.562, "t": 168.37900000000002, "r": 365.541, "b": 176.019, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.562, "r_y0": 176.019, "r_x1": 365.541, "r_y1": 176.019, "r_x2": 365.541, "r_y2": 168.37900000000002, "r_x3": 359.562, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 169.747, "t": 243.31100000000004, "r": 175.271, "b": 250.95100000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 250.95100000000002, "r_x1": 175.271, "r_y1": 250.95100000000002, "r_x2": 175.271, "r_y2": 243.31100000000004, "r_x3": 169.747, "r_y3": 243.31100000000004, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "section_header", "id": 9, "page_no": 6, "cluster": {"id": 9, "label": "section_header", "bbox": {"l": 134.765, "t": 305.296, "r": 246.652, "b": 314.103, "coord_origin": "TOPLEFT"}, "confidence": 0.9233023524284363, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 314.103, "r_x1": 149.402, "r_y1": 314.103, "r_x2": 149.402, "r_y2": 305.296, "r_x3": 134.765, "r_y3": 305.296, "coord_origin": "TOPLEFT"}, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 314.103, "r_x1": 246.652, "r_y1": 314.103, "r_x2": 246.652, "r_y2": 305.296, "r_x3": 160.859, "r_y3": 305.296, "coord_origin": "TOPLEFT"}, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.2 Language Syntax"}, {"label": "text", "id": 10, "page_no": 6, "cluster": {"id": 10, "label": "text", "bbox": {"l": 134.765, "t": 325.248, "r": 363.796, "b": 334.045, "coord_origin": "TOPLEFT"}, "confidence": 0.9169168472290039, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 334.045, "r_x1": 363.796, "r_y1": 334.045, "r_x2": 363.796, "r_y2": 325.248, "r_x3": 134.765, "r_y3": 325.248, "coord_origin": "TOPLEFT"}, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The OTSL representation follows these syntax rules:"}, {"label": "list_item", "id": 3, "page_no": 6, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 138.973, "t": 347.171, "r": 480.589, "b": 367.934, "coord_origin": "TOPLEFT"}, "confidence": 0.9588112235069275, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 355.978, "r_x1": 146.72, "r_y1": 355.978, "r_x2": 146.72, "r_y2": 347.181, "r_x3": 138.973, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 355.978, "r_x1": 257.379, "r_y1": 355.978, "r_x2": 257.379, "r_y2": 347.171, "r_x3": 151.701, "r_y3": 347.171, "coord_origin": "TOPLEFT"}, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.383, "r_y0": 355.978, "r_x1": 260.15, "r_y1": 355.978, "r_x2": 260.15, "r_y2": 347.181, "r_x3": 257.383, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.184, "r_y0": 355.978, "r_x1": 480.589, "r_y1": 355.978, "r_x2": 480.589, "r_y2": 347.181, "r_x3": 264.184, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": "The left neighbour of an \"L\" cell must be either", "orig": "The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 367.934, "r_x1": 283.594, "r_y1": 367.934, "r_x2": 283.594, "r_y2": 359.137, "r_x3": 151.701, "r_y3": 359.137, "coord_origin": "TOPLEFT"}, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Left-looking cell rule : The left neighbour of an \"L\" cell must be either another \"L\" cell or a \"C\" cell."}, {"label": "list_item", "id": 4, "page_no": 6, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 138.973, "t": 371.085, "r": 480.592, "b": 391.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9585386514663696, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 379.892, "r_x1": 146.72, "r_y1": 379.892, "r_x2": 146.72, "r_y2": 371.095, "r_x3": 138.973, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 379.892, "r_x1": 252.112, "r_y1": 379.892, "r_x2": 252.112, "r_y2": 371.085, "r_x3": 151.701, "r_y3": 371.085, "coord_origin": "TOPLEFT"}, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.112, "r_y0": 379.892, "r_x1": 254.879, "r_y1": 379.892, "r_x2": 254.879, "r_y2": 371.095, "r_x3": 252.112, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.764, "r_y0": 379.892, "r_x1": 480.592, "r_y1": 379.892, "r_x2": 480.592, "r_y2": 371.095, "r_x3": 258.764, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": "The upper neighbour of a \"U\" cell must be either", "orig": "The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 391.847, "r_x1": 284.839, "r_y1": 391.847, "r_x2": 284.839, "r_y2": 383.05, "r_x3": 151.701, "r_y3": 383.05, "coord_origin": "TOPLEFT"}, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Up-looking cell rule : The upper neighbour of a \"U\" cell must be either another \"U\" cell or a \"C\" cell."}, {"label": "section_header", "id": 14, "page_no": 6, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 138.973, "t": 394.998, "r": 226.074, "b": 403.805, "coord_origin": "TOPLEFT"}, "confidence": 0.6506174206733704, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 403.805, "r_x1": 146.72, "r_y1": 403.805, "r_x2": 146.72, "r_y2": 395.008, "r_x3": 138.973, "r_y3": 395.008, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 403.805, "r_x1": 223.304, "r_y1": 403.805, "r_x2": 223.304, "r_y2": 394.998, "r_x3": 151.701, "r_y3": 394.998, "coord_origin": "TOPLEFT"}, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 223.307, "r_y0": 403.805, "r_x1": 226.074, "r_y1": 403.805, "r_x2": 226.074, "r_y2": 395.008, "r_x3": 223.307, "r_y3": 395.008, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Cross cell rule :"}, {"label": "list_item", "id": 13, "page_no": 6, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 151.701, "t": 406.967, "r": 480.592, "b": 439.674, "coord_origin": "TOPLEFT"}, "confidence": 0.7247239947319031, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 415.764, "r_x1": 480.592, "r_y1": 415.764, "r_x2": 480.592, "r_y2": 406.967, "r_x3": 151.701, "r_y3": 406.967, "coord_origin": "TOPLEFT"}, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 427.719, "r_x1": 480.592, "r_y1": 427.719, "r_x2": 480.592, "r_y2": 418.922, "r_x3": 151.701, "r_y3": 418.922, "coord_origin": "TOPLEFT"}, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 439.674, "r_x1": 214.397, "r_y1": 439.674, "r_x2": 214.397, "r_y2": 430.877, "r_x3": 151.701, "r_y3": 430.877, "coord_origin": "TOPLEFT"}, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\" cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell or an \"L\" cell."}, {"label": "list_item", "id": 8, "page_no": 6, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 138.973, "t": 442.826, "r": 474.59, "b": 451.633, "coord_origin": "TOPLEFT"}, "confidence": 0.9259927272796631, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 451.633, "r_x1": 146.72, "r_y1": 451.633, "r_x2": 146.72, "r_y2": 442.836, "r_x3": 138.973, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 451.633, "r_x1": 221.323, "r_y1": 451.633, "r_x2": 221.323, "r_y2": 442.826, "r_x3": 151.701, "r_y3": 442.826, "coord_origin": "TOPLEFT"}, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.327, "r_y0": 451.633, "r_x1": 224.094, "r_y1": 451.633, "r_x2": 224.094, "r_y2": 442.836, "r_x3": 221.327, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.411, "r_y0": 451.633, "r_x1": 474.59, "r_y1": 451.633, "r_x2": 474.59, "r_y2": 442.836, "r_x3": 227.411, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": "Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": "Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. First row rule : Only \"L\" cells and \"C\" cells are allowed in the first row."}, {"label": "list_item", "id": 5, "page_no": 6, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 138.973, "t": 454.784, "r": 480.588, "b": 475.546, "coord_origin": "TOPLEFT"}, "confidence": 0.9420599937438965, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 463.591, "r_x1": 146.72, "r_y1": 463.591, "r_x2": 146.72, "r_y2": 454.794, "r_x3": 138.973, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 463.591, "r_x1": 240.72, "r_y1": 463.591, "r_x2": 240.72, "r_y2": 454.784, "r_x3": 151.701, "r_y3": 454.784, "coord_origin": "TOPLEFT"}, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.716, "r_y0": 463.591, "r_x1": 243.483, "r_y1": 463.591, "r_x2": 243.483, "r_y2": 454.794, "r_x3": 240.716, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.458, "r_y0": 463.591, "r_x1": 480.588, "r_y1": 463.591, "r_x2": 480.588, "r_y2": 454.794, "r_x3": 247.458, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": "Only \"U\" cells and \"C\" cells are allowed in the first", "orig": "Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 475.546, "r_x1": 186.007, "r_y1": 475.546, "r_x2": 186.007, "r_y2": 466.749, "r_x3": 151.701, "r_y3": 466.749, "coord_origin": "TOPLEFT"}, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. First column rule : Only \"U\" cells and \"C\" cells are allowed in the first column."}, {"label": "list_item", "id": 1, "page_no": 6, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 138.973, "t": 478.697, "r": 480.595, "b": 499.46, "coord_origin": "TOPLEFT"}, "confidence": 0.9617829918861389, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 487.504, "r_x1": 146.72, "r_y1": 487.504, "r_x2": 146.72, "r_y2": 478.707, "r_x3": 138.973, "r_y3": 478.707, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 487.504, "r_x1": 235.158, "r_y1": 487.504, "r_x2": 235.158, "r_y2": 478.697, "r_x3": 151.701, "r_y3": 478.697, "coord_origin": "TOPLEFT"}, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.157, "r_y0": 487.504, "r_x1": 480.595, "r_y1": 487.504, "r_x2": 480.595, "r_y2": 478.707, "r_x3": 235.157, "r_y3": 478.707, "coord_origin": "TOPLEFT"}, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 499.46, "r_x1": 448.042, "r_y1": 499.46, "r_x2": 448.042, "r_y2": 490.663, "r_x3": 151.701, "r_y3": 490.663, "coord_origin": "TOPLEFT"}, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Rectangular rule : The table representation is always rectangular - all rows must have an equal number of tokens, terminated with \"NL\" token."}, {"label": "text", "id": 0, "page_no": 6, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 512.5930000000001, "r": 480.596, "b": 640.942, "coord_origin": "TOPLEFT"}, "confidence": 0.9785562753677368, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 521.39, "r_x1": 480.596, "r_y1": 521.39, "r_x2": 480.596, "r_y2": 512.5930000000001, "r_x3": 149.709, "r_y3": 512.5930000000001, "coord_origin": "TOPLEFT"}, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.345, "r_x1": 480.591, "r_y1": 533.345, "r_x2": 480.591, "r_y2": 524.548, "r_x3": 134.765, "r_y3": 524.548, "coord_origin": "TOPLEFT"}, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.3, "r_x1": 480.595, "r_y1": 545.3, "r_x2": 480.595, "r_y2": 536.5029999999999, "r_x3": 134.765, "r_y3": 536.5029999999999, "coord_origin": "TOPLEFT"}, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.256, "r_x1": 480.589, "r_y1": 557.256, "r_x2": 480.589, "r_y2": 548.4590000000001, "r_x3": 134.765, "r_y3": 548.4590000000001, "coord_origin": "TOPLEFT"}, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.211, "r_x1": 480.594, "r_y1": 569.211, "r_x2": 480.594, "r_y2": 560.414, "r_x3": 134.765, "r_y3": 560.414, "coord_origin": "TOPLEFT"}, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.1659999999999, "r_x1": 480.587, "r_y1": 581.1659999999999, "r_x2": 480.587, "r_y2": 572.369, "r_x3": 134.765, "r_y3": 572.369, "coord_origin": "TOPLEFT"}, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.121, "r_x1": 480.592, "r_y1": 593.121, "r_x2": 480.592, "r_y2": 584.3240000000001, "r_x3": 134.765, "r_y3": 584.3240000000001, "coord_origin": "TOPLEFT"}, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.076, "r_x1": 480.592, "r_y1": 605.076, "r_x2": 480.592, "r_y2": 596.279, "r_x3": 134.765, "r_y3": 596.279, "coord_origin": "TOPLEFT"}, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.032, "r_x1": 480.594, "r_y1": 617.032, "r_x2": 480.594, "r_y2": 608.235, "r_x3": 134.765, "r_y3": 608.235, "coord_origin": "TOPLEFT"}, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.987, "r_x1": 480.591, "r_y1": 628.987, "r_x2": 480.591, "r_y2": 620.19, "r_x3": 134.765, "r_y3": 620.19, "coord_origin": "TOPLEFT"}, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.942, "r_x1": 311.198, "r_y1": 640.942, "r_x2": 311.198, "r_y2": 632.145, "r_x3": 134.765, "r_y3": 632.145, "coord_origin": "TOPLEFT"}, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The application of these rules gives OTSL a set of unique properties. First of all, the OTSL enforces a strictly rectangular structure representation, where every new-line token starts a new row. As a consequence, all rows and all columns have exactly the same number of tokens, irrespective of cell spans. Secondly, the OTSL representation is unambiguous: Every table structure is represented in one way. In this representation every table cell corresponds to a \"C\"-cell token, which in case of spans is always located in the top-left corner of the table cell definition. Third, OTSL syntax rules are only backward-looking. As a consequence, every predicted token can be validated straight during sequence generation by looking at the previously predicted sequence. As such, OTSL can guarantee that every predicted sequence is syntactically valid."}, {"label": "text", "id": 2, "page_no": 6, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 644.1030000000001, "r": 480.593, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9590610861778259, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 149.709, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 480.593, "r_y1": 664.855, "r_x2": 480.593, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "These characteristics can be easily learned by sequence generator networks, as we demonstrate further below. We find strong indications that this pattern"}], "body": [{"label": "caption", "id": 6, "page_no": 6, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 134.765, "t": 123.58399999999995, "r": 480.587, "b": 156.79100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9333080053329468, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 133.72500000000002, "r_x1": 162.644, "r_y1": 133.72500000000002, "r_x2": 162.644, "r_y2": 125.79899999999998, "r_x3": 134.765, "r_y3": 125.79899999999998, "coord_origin": "TOPLEFT"}, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.276, "r_y0": 134.87300000000005, "r_x1": 480.587, "r_y1": 134.87300000000005, "r_x2": 480.587, "r_y2": 123.58399999999995, "r_x3": 166.276, "r_y3": 123.58399999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 145.832, "r_x1": 171.412, "r_y1": 145.832, "r_x2": 171.412, "r_y2": 134.543, "r_x3": 134.765, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "sentation", "orig": "sentation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.546, "r_y0": 145.832, "r_x1": 182.968, "r_y1": 145.832, "r_x2": 182.968, "r_y2": 134.543, "r_x3": 175.546, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.093, "r_y0": 145.832, "r_x1": 207.058, "r_y1": 145.832, "r_x2": 207.058, "r_y2": 134.543, "r_x3": 187.093, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.192, "r_y0": 145.832, "r_x1": 250.188, "r_y1": 145.832, "r_x2": 250.188, "r_y2": 134.543, "r_x3": 211.192, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "structure;", "orig": "structure;", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.312, "r_y0": 145.832, "r_x1": 480.587, "r_y1": 145.832, "r_x2": 480.587, "r_y2": 134.543, "r_x3": 254.312, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "C - mapping structure on a grid; D - OTSL structure", "orig": "C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 156.79100000000005, "r_x1": 306.116, "r_y1": 156.79100000000005, "r_x2": 306.116, "r_y2": 145.50199999999995, "r_x3": 134.765, "r_y3": 145.50199999999995, "coord_origin": "TOPLEFT"}, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 3. OTSL description of table structure: A - table example; B - graphical representation of table structure; C - mapping structure on a grid; D - OTSL structure encoding; E - explanation on cell encoding"}, {"label": "picture", "id": 12, "page_no": 6, "cluster": {"id": 12, "label": "picture", "bbox": {"l": 164.65028381347656, "t": 163.79708862304688, "r": 449.5505676269531, "b": 280.3409423828125, "coord_origin": "TOPLEFT"}, "confidence": 0.7868534922599792, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.493, "r_y0": 177.88099999999997, "r_x1": 428.861, "r_y1": 177.22199999999998, "r_x2": 428.861, "r_y2": 168.05399999999997, "r_x3": 374.493, "r_y3": 168.71299999999997, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.769, "r_y0": 202.21299999999997, "r_x1": 448.17, "r_y1": 201.78200000000004, "r_x2": 448.17, "r_y2": 192.61400000000003, "r_x3": 373.769, "r_y3": 193.04499999999996, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.687, "r_y0": 214.42499999999995, "r_x1": 448.085, "r_y1": 214.11800000000005, "r_x2": 448.085, "r_y2": 204.95000000000005, "r_x3": 386.687, "r_y3": 205.25699999999995, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.657, "r_y0": 190.01999999999998, "r_x1": 448.147, "r_y1": 189.48800000000006, "r_x2": 448.147, "r_y2": 180.32000000000005, "r_x3": 398.657, "r_y3": 180.85199999999998, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.506, "r_y0": 226.32600000000002, "r_x1": 448.302, "r_y1": 226.52099999999996, "r_x2": 448.302, "r_y2": 217.35299999999995, "r_x3": 386.506, "r_y3": 217.15800000000002, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.16, "r_y0": 176.97699999999998, "r_x1": 447.863, "r_y1": 176.97699999999998, "r_x2": 447.863, "r_y2": 167.80899999999997, "r_x3": 435.16, "r_y3": 167.80899999999997, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.15, "r_y0": 214.52200000000005, "r_x1": 381.325, "r_y1": 214.52200000000005, "r_x2": 381.325, "r_y2": 205.35400000000004, "r_x3": 374.15, "r_y3": 205.35400000000004, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.042, "r_y0": 226.43399999999997, "r_x1": 381.217, "r_y1": 226.43399999999997, "r_x2": 381.217, "r_y2": 217.26599999999996, "r_x3": 374.042, "r_y3": 217.26599999999996, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.344, "r_y0": 190.22199999999998, "r_x1": 393.765, "r_y1": 190.07299999999998, "r_x2": 393.765, "r_y2": 180.90499999999997, "r_x3": 374.344, "r_y3": 181.05399999999997, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.259, "r_y0": 253.79600000000005, "r_x1": 301.055, "r_y1": 253.78099999999995, "r_x2": 301.055, "r_y2": 244.61300000000006, "r_x3": 282.259, "r_y3": 244.62800000000004, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.11, "r_y0": 266.13800000000003, "r_x1": 325.59, "r_y1": 265.58900000000006, "r_x2": 325.59, "r_y2": 256.42100000000005, "r_x3": 282.11, "r_y3": 256.96900000000005, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.408, "r_y0": 278.41999999999996, "r_x1": 325.478, "r_y1": 278.14200000000005, "r_x2": 325.478, "r_y2": 268.97400000000005, "r_x3": 282.408, "r_y3": 269.25199999999995, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 307.466, "r_y0": 253.861, "r_x1": 312.992, "r_y1": 253.861, "r_x2": 312.992, "r_y2": 244.69299999999998, "r_x3": 307.466, "r_y3": 244.69299999999998, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.769, "r_y0": 253.72799999999995, "r_x1": 324.294, "r_y1": 253.72799999999995, "r_x2": 324.294, "r_y2": 244.55999999999995, "r_x3": 318.769, "r_y3": 244.55999999999995, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.939, "r_y0": 278.03499999999997, "r_x1": 214.734, "r_y1": 278.02, "r_x2": 214.734, "r_y2": 268.852, "r_x3": 195.939, "r_y3": 268.86699999999996, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.146, "r_y0": 278.1, "r_x1": 226.671, "r_y1": 278.1, "r_x2": 226.671, "r_y2": 268.932, "r_x3": 221.146, "r_y3": 268.932, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.449, "r_y0": 277.967, "r_x1": 237.974, "r_y1": 277.967, "r_x2": 237.974, "r_y2": 268.799, "r_x3": 232.449, "r_y3": 268.799, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.217, "r_y0": 253.827, "r_x1": 203.392, "r_y1": 253.827, "r_x2": 203.392, "r_y2": 244.659, "r_x3": 196.217, "r_y3": 244.659, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.321, "r_y0": 253.385, "r_x1": 257.497, "r_y1": 253.385, "r_x2": 257.497, "r_y2": 244.21699999999998, "r_x3": 250.321, "r_y3": 244.21699999999998, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.172, "r_y0": 265.727, "r_x1": 257.348, "r_y1": 265.727, "r_x2": 257.348, "r_y2": 256.55899999999997, "r_x3": 250.172, "r_y3": 256.55899999999997, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.47, "r_y0": 278.01, "r_x1": 257.646, "r_y1": 278.01, "r_x2": 257.646, "r_y2": 268.842, "r_x3": 250.47, "r_y3": 268.842, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 249.18600000000004, "r_x1": 391.495, "r_y1": 249.18600000000004, "r_x2": 391.495, "r_y2": 243.07399999999996, "r_x3": 334.511, "r_y3": 243.07399999999996, "coord_origin": "TOPLEFT"}, "text": "1 - simple cells: \"C\"", "orig": "1 - simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 259.124, "r_x1": 421.986, "r_y1": 259.124, "r_x2": 421.986, "r_y2": 253.01199999999994, "r_x3": 334.511, "r_y3": 253.01199999999994, "coord_origin": "TOPLEFT"}, "text": "2 - horizontal merges: \"C\", \"L\"", "orig": "2 - horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 269.062, "r_x1": 415.344, "r_y1": 269.062, "r_x2": 415.344, "r_y2": 262.95000000000005, "r_x3": 334.511, "r_y3": 262.95000000000005, "coord_origin": "TOPLEFT"}, "text": "3 - vertical merges: \"C\", \"U\"", "orig": "3 - vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 279.0, "r_x1": 426.599, "r_y1": 279.0, "r_x2": 426.599, "r_y2": 272.88800000000003, "r_x3": 334.511, "r_y3": 272.88800000000003, "coord_origin": "TOPLEFT"}, "text": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.672, "r_y0": 250.23400000000004, "r_x1": 189.355, "r_y1": 250.23400000000004, "r_x2": 189.355, "r_y2": 244.12199999999996, "r_x3": 185.672, "r_y3": 244.12199999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.968, "r_y0": 274.539, "r_x1": 189.651, "r_y1": 274.539, "r_x2": 189.651, "r_y2": 268.427, "r_x3": 185.968, "r_y3": 268.427, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.342, "r_y0": 249.817, "r_x1": 243.025, "r_y1": 249.817, "r_x2": 243.025, "r_y2": 243.70500000000004, "r_x3": 239.342, "r_y3": 243.70500000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.329, "r_y0": 249.68499999999995, "r_x1": 275.012, "r_y1": 249.68499999999995, "r_x2": 275.012, "r_y2": 243.57299999999998, "r_x3": 271.329, "r_y3": 243.57299999999998, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.816, "r_y0": 172.707, "r_x1": 233.5, "r_y1": 172.707, "r_x2": 233.5, "r_y2": 166.59400000000005, "r_x3": 229.816, "r_y3": 166.59400000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.244, "r_y0": 196.15300000000002, "r_x1": 260.928, "r_y1": 196.15300000000002, "r_x2": 260.928, "r_y2": 190.03999999999996, "r_x3": 257.244, "r_y3": 190.03999999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.875, "r_y0": 184.168, "r_x1": 190.559, "r_y1": 184.168, "r_x2": 190.559, "r_y2": 178.05600000000004, "r_x3": 186.875, "r_y3": 178.05600000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.487, "r_y0": 175.207, "r_x1": 200.171, "r_y1": 175.207, "r_x2": 200.171, "r_y2": 169.09500000000003, "r_x3": 196.487, "r_y3": 169.09500000000003, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 175.62199999999996, "r_x1": 175.727, "r_y1": 175.62199999999996, "r_x2": 175.727, "r_y2": 167.98199999999997, "r_x3": 169.747, "r_y3": 167.98199999999997, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 214.57799999999997, "r_x1": 175.727, "r_y1": 214.57799999999997, "r_x2": 175.727, "r_y2": 206.938, "r_x3": 169.747, "r_y3": 206.938, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.294, "r_y0": 176.019, "r_x1": 280.273, "r_y1": 176.019, "r_x2": 280.273, "r_y2": 168.37900000000002, "r_x3": 274.294, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.562, "r_y0": 176.019, "r_x1": 365.541, "r_y1": 176.019, "r_x2": 365.541, "r_y2": 168.37900000000002, "r_x3": 359.562, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 250.95100000000002, "r_x1": 175.271, "r_y1": 250.95100000000002, "r_x2": 175.271, "r_y2": 243.31100000000004, "r_x3": 169.747, "r_y3": 243.31100000000004, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 38, "label": "text", "bbox": {"l": 374.493, "t": 168.05399999999997, "r": 428.861, "b": 177.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.493, "r_y0": 177.88099999999997, "r_x1": 428.861, "r_y1": 177.22199999999998, "r_x2": 428.861, "r_y2": 168.05399999999997, "r_x3": 374.493, "r_y3": 168.71299999999997, "coord_origin": "TOPLEFT"}, "text": "C L C L L", "orig": "C L C L L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 373.769, "t": 192.61400000000003, "r": 448.17, "b": 202.21299999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.769, "r_y0": 202.21299999999997, "r_x1": 448.17, "r_y1": 201.78200000000004, "r_x2": 448.17, "r_y2": 192.61400000000003, "r_x3": 373.769, "r_y3": 193.04499999999996, "coord_origin": "TOPLEFT"}, "text": "C C C C C NL", "orig": "C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 386.687, "t": 204.95000000000005, "r": 448.085, "b": 214.42499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.687, "r_y0": 214.42499999999995, "r_x1": 448.085, "r_y1": 214.11800000000005, "r_x2": 448.085, "r_y2": 204.95000000000005, "r_x3": 386.687, "r_y3": 205.25699999999995, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 398.657, "t": 180.32000000000005, "r": 448.147, "b": 190.01999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.657, "r_y0": 190.01999999999998, "r_x1": 448.147, "r_y1": 189.48800000000006, "r_x2": 448.147, "r_y2": 180.32000000000005, "r_x3": 398.657, "r_y3": 180.85199999999998, "coord_origin": "TOPLEFT"}, "text": "C C C NL", "orig": "C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 386.506, "t": 217.15800000000002, "r": 448.302, "b": 226.52099999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.506, "r_y0": 226.32600000000002, "r_x1": 448.302, "r_y1": 226.52099999999996, "r_x2": 448.302, "r_y2": 217.35299999999995, "r_x3": 386.506, "r_y3": 217.15800000000002, "coord_origin": "TOPLEFT"}, "text": "C C C C NL", "orig": "C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 435.16, "t": 167.80899999999997, "r": 447.863, "b": 176.97699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.16, "r_y0": 176.97699999999998, "r_x1": 447.863, "r_y1": 176.97699999999998, "r_x2": 447.863, "r_y2": 167.80899999999997, "r_x3": 435.16, "r_y3": 167.80899999999997, "coord_origin": "TOPLEFT"}, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 374.15, "t": 205.35400000000004, "r": 381.325, "b": 214.52200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.15, "r_y0": 214.52200000000005, "r_x1": 381.325, "r_y1": 214.52200000000005, "r_x2": 381.325, "r_y2": 205.35400000000004, "r_x3": 374.15, "r_y3": 205.35400000000004, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 374.042, "t": 217.26599999999996, "r": 381.217, "b": 226.43399999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.042, "r_y0": 226.43399999999997, "r_x1": 381.217, "r_y1": 226.43399999999997, "r_x2": 381.217, "r_y2": 217.26599999999996, "r_x3": 374.042, "r_y3": 217.26599999999996, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 374.344, "t": 180.90499999999997, "r": 393.765, "b": 190.22199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.344, "r_y0": 190.22199999999998, "r_x1": 393.765, "r_y1": 190.07299999999998, "r_x2": 393.765, "r_y2": 180.90499999999997, "r_x3": 374.344, "r_y3": 181.05399999999997, "coord_origin": "TOPLEFT"}, "text": "U X", "orig": "U X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 282.259, "t": 244.61300000000006, "r": 301.055, "b": 253.79600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.259, "r_y0": 253.79600000000005, "r_x1": 301.055, "r_y1": 253.78099999999995, "r_x2": 301.055, "r_y2": 244.61300000000006, "r_x3": 282.259, "r_y3": 244.62800000000004, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 282.11, "t": 256.42100000000005, "r": 325.59, "b": 266.13800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.11, "r_y0": 266.13800000000003, "r_x1": 325.59, "r_y1": 265.58900000000006, "r_x2": 325.59, "r_y2": 256.42100000000005, "r_x3": 282.11, "r_y3": 256.96900000000005, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 282.408, "t": 268.97400000000005, "r": 325.478, "b": 278.41999999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.408, "r_y0": 278.41999999999996, "r_x1": 325.478, "r_y1": 278.14200000000005, "r_x2": 325.478, "r_y2": 268.97400000000005, "r_x3": 282.408, "r_y3": 269.25199999999995, "coord_origin": "TOPLEFT"}, "text": "U X X X", "orig": "U X X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 307.466, "t": 244.69299999999998, "r": 312.992, "b": 253.861, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 307.466, "r_y0": 253.861, "r_x1": 312.992, "r_y1": 253.861, "r_x2": 312.992, "r_y2": 244.69299999999998, "r_x3": 307.466, "r_y3": 244.69299999999998, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 318.769, "t": 244.55999999999995, "r": 324.294, "b": 253.72799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.769, "r_y0": 253.72799999999995, "r_x1": 324.294, "r_y1": 253.72799999999995, "r_x2": 324.294, "r_y2": 244.55999999999995, "r_x3": 318.769, "r_y3": 244.55999999999995, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 195.939, "t": 268.852, "r": 214.734, "b": 278.03499999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.939, "r_y0": 278.03499999999997, "r_x1": 214.734, "r_y1": 278.02, "r_x2": 214.734, "r_y2": 268.852, "r_x3": 195.939, "r_y3": 268.86699999999996, "coord_origin": "TOPLEFT"}, "text": "C L", "orig": "C L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 221.146, "t": 268.932, "r": 226.671, "b": 278.1, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.146, "r_y0": 278.1, "r_x1": 226.671, "r_y1": 278.1, "r_x2": 226.671, "r_y2": 268.932, "r_x3": 221.146, "r_y3": 268.932, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 232.449, "t": 268.799, "r": 237.974, "b": 277.967, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.449, "r_y0": 277.967, "r_x1": 237.974, "r_y1": 277.967, "r_x2": 237.974, "r_y2": 268.799, "r_x3": 232.449, "r_y3": 268.799, "coord_origin": "TOPLEFT"}, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 196.217, "t": 244.659, "r": 203.392, "b": 253.827, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.217, "r_y0": 253.827, "r_x1": 203.392, "r_y1": 253.827, "r_x2": 203.392, "r_y2": 244.659, "r_x3": 196.217, "r_y3": 244.659, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 250.321, "t": 244.21699999999998, "r": 257.497, "b": 253.385, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.321, "r_y0": 253.385, "r_x1": 257.497, "r_y1": 253.385, "r_x2": 257.497, "r_y2": 244.21699999999998, "r_x3": 250.321, "r_y3": 244.21699999999998, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 250.172, "t": 256.55899999999997, "r": 257.348, "b": 265.727, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.172, "r_y0": 265.727, "r_x1": 257.348, "r_y1": 265.727, "r_x2": 257.348, "r_y2": 256.55899999999997, "r_x3": 250.172, "r_y3": 256.55899999999997, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 250.47, "t": 268.842, "r": 257.646, "b": 278.01, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.47, "r_y0": 278.01, "r_x1": 257.646, "r_y1": 278.01, "r_x2": 257.646, "r_y2": 268.842, "r_x3": 250.47, "r_y3": 268.842, "coord_origin": "TOPLEFT"}, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 334.511, "t": 243.07399999999996, "r": 391.495, "b": 249.18600000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 249.18600000000004, "r_x1": 391.495, "r_y1": 249.18600000000004, "r_x2": 391.495, "r_y2": 243.07399999999996, "r_x3": 334.511, "r_y3": 243.07399999999996, "coord_origin": "TOPLEFT"}, "text": "1 - simple cells: \"C\"", "orig": "1 - simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 334.511, "t": 253.01199999999994, "r": 421.986, "b": 259.124, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 259.124, "r_x1": 421.986, "r_y1": 259.124, "r_x2": 421.986, "r_y2": 253.01199999999994, "r_x3": 334.511, "r_y3": 253.01199999999994, "coord_origin": "TOPLEFT"}, "text": "2 - horizontal merges: \"C\", \"L\"", "orig": "2 - horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 334.511, "t": 262.95000000000005, "r": 415.344, "b": 269.062, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 269.062, "r_x1": 415.344, "r_y1": 269.062, "r_x2": 415.344, "r_y2": 262.95000000000005, "r_x3": 334.511, "r_y3": 262.95000000000005, "coord_origin": "TOPLEFT"}, "text": "3 - vertical merges: \"C\", \"U\"", "orig": "3 - vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "list_item", "bbox": {"l": 334.511, "t": 272.88800000000003, "r": 426.599, "b": 279.0, "coord_origin": "TOPLEFT"}, "confidence": 0.5250625610351562, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.511, "r_y0": 279.0, "r_x1": 426.599, "r_y1": 279.0, "r_x2": 426.599, "r_y2": 272.88800000000003, "r_x3": 334.511, "r_y3": 272.88800000000003, "coord_origin": "TOPLEFT"}, "text": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "4 - 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 185.672, "t": 244.12199999999996, "r": 189.355, "b": 250.23400000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.672, "r_y0": 250.23400000000004, "r_x1": 189.355, "r_y1": 250.23400000000004, "r_x2": 189.355, "r_y2": 244.12199999999996, "r_x3": 185.672, "r_y3": 244.12199999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 185.968, "t": 268.427, "r": 189.651, "b": 274.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.968, "r_y0": 274.539, "r_x1": 189.651, "r_y1": 274.539, "r_x2": 189.651, "r_y2": 268.427, "r_x3": 185.968, "r_y3": 268.427, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 239.342, "t": 243.70500000000004, "r": 243.025, "b": 249.817, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.342, "r_y0": 249.817, "r_x1": 243.025, "r_y1": 249.817, "r_x2": 243.025, "r_y2": 243.70500000000004, "r_x3": 239.342, "r_y3": 243.70500000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 271.329, "t": 243.57299999999998, "r": 275.012, "b": 249.68499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.329, "r_y0": 249.68499999999995, "r_x1": 275.012, "r_y1": 249.68499999999995, "r_x2": 275.012, "r_y2": 243.57299999999998, "r_x3": 271.329, "r_y3": 243.57299999999998, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 229.816, "t": 166.59400000000005, "r": 233.5, "b": 172.707, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.816, "r_y0": 172.707, "r_x1": 233.5, "r_y1": 172.707, "r_x2": 233.5, "r_y2": 166.59400000000005, "r_x3": 229.816, "r_y3": 166.59400000000005, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 257.244, "t": 190.03999999999996, "r": 260.928, "b": 196.15300000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.244, "r_y0": 196.15300000000002, "r_x1": 260.928, "r_y1": 196.15300000000002, "r_x2": 260.928, "r_y2": 190.03999999999996, "r_x3": 257.244, "r_y3": 190.03999999999996, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 186.875, "t": 178.05600000000004, "r": 190.559, "b": 184.168, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.875, "r_y0": 184.168, "r_x1": 190.559, "r_y1": 184.168, "r_x2": 190.559, "r_y2": 178.05600000000004, "r_x3": 186.875, "r_y3": 178.05600000000004, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 196.487, "t": 169.09500000000003, "r": 200.171, "b": 175.207, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.487, "r_y0": 175.207, "r_x1": 200.171, "r_y1": 175.207, "r_x2": 200.171, "r_y2": 169.09500000000003, "r_x3": 196.487, "r_y3": 169.09500000000003, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 169.747, "t": 167.98199999999997, "r": 175.727, "b": 175.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 175.62199999999996, "r_x1": 175.727, "r_y1": 175.62199999999996, "r_x2": 175.727, "r_y2": 167.98199999999997, "r_x3": 169.747, "r_y3": 167.98199999999997, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 169.747, "t": 206.938, "r": 175.727, "b": 214.57799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 214.57799999999997, "r_x1": 175.727, "r_y1": 214.57799999999997, "r_x2": 175.727, "r_y2": 206.938, "r_x3": 169.747, "r_y3": 206.938, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 274.294, "t": 168.37900000000002, "r": 280.273, "b": 176.019, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.294, "r_y0": 176.019, "r_x1": 280.273, "r_y1": 176.019, "r_x2": 280.273, "r_y2": 168.37900000000002, "r_x3": 274.294, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 359.562, "t": 168.37900000000002, "r": 365.541, "b": 176.019, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.562, "r_y0": 176.019, "r_x1": 365.541, "r_y1": 176.019, "r_x2": 365.541, "r_y2": 168.37900000000002, "r_x3": 359.562, "r_y3": 168.37900000000002, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 169.747, "t": 243.31100000000004, "r": 175.271, "b": 250.95100000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.747, "r_y0": 250.95100000000002, "r_x1": 175.271, "r_y1": 250.95100000000002, "r_x2": 175.271, "r_y2": 243.31100000000004, "r_x3": 169.747, "r_y3": 243.31100000000004, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "section_header", "id": 9, "page_no": 6, "cluster": {"id": 9, "label": "section_header", "bbox": {"l": 134.765, "t": 305.296, "r": 246.652, "b": 314.103, "coord_origin": "TOPLEFT"}, "confidence": 0.9233023524284363, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 314.103, "r_x1": 149.402, "r_y1": 314.103, "r_x2": 149.402, "r_y2": 305.296, "r_x3": 134.765, "r_y3": 305.296, "coord_origin": "TOPLEFT"}, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 314.103, "r_x1": 246.652, "r_y1": 314.103, "r_x2": 246.652, "r_y2": 305.296, "r_x3": 160.859, "r_y3": 305.296, "coord_origin": "TOPLEFT"}, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.2 Language Syntax"}, {"label": "text", "id": 10, "page_no": 6, "cluster": {"id": 10, "label": "text", "bbox": {"l": 134.765, "t": 325.248, "r": 363.796, "b": 334.045, "coord_origin": "TOPLEFT"}, "confidence": 0.9169168472290039, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 334.045, "r_x1": 363.796, "r_y1": 334.045, "r_x2": 363.796, "r_y2": 325.248, "r_x3": 134.765, "r_y3": 325.248, "coord_origin": "TOPLEFT"}, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The OTSL representation follows these syntax rules:"}, {"label": "list_item", "id": 3, "page_no": 6, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 138.973, "t": 347.171, "r": 480.589, "b": 367.934, "coord_origin": "TOPLEFT"}, "confidence": 0.9588112235069275, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 355.978, "r_x1": 146.72, "r_y1": 355.978, "r_x2": 146.72, "r_y2": 347.181, "r_x3": 138.973, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 355.978, "r_x1": 257.379, "r_y1": 355.978, "r_x2": 257.379, "r_y2": 347.171, "r_x3": 151.701, "r_y3": 347.171, "coord_origin": "TOPLEFT"}, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.383, "r_y0": 355.978, "r_x1": 260.15, "r_y1": 355.978, "r_x2": 260.15, "r_y2": 347.181, "r_x3": 257.383, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.184, "r_y0": 355.978, "r_x1": 480.589, "r_y1": 355.978, "r_x2": 480.589, "r_y2": 347.181, "r_x3": 264.184, "r_y3": 347.181, "coord_origin": "TOPLEFT"}, "text": "The left neighbour of an \"L\" cell must be either", "orig": "The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 367.934, "r_x1": 283.594, "r_y1": 367.934, "r_x2": 283.594, "r_y2": 359.137, "r_x3": 151.701, "r_y3": 359.137, "coord_origin": "TOPLEFT"}, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Left-looking cell rule : The left neighbour of an \"L\" cell must be either another \"L\" cell or a \"C\" cell."}, {"label": "list_item", "id": 4, "page_no": 6, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 138.973, "t": 371.085, "r": 480.592, "b": 391.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9585386514663696, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 379.892, "r_x1": 146.72, "r_y1": 379.892, "r_x2": 146.72, "r_y2": 371.095, "r_x3": 138.973, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 379.892, "r_x1": 252.112, "r_y1": 379.892, "r_x2": 252.112, "r_y2": 371.085, "r_x3": 151.701, "r_y3": 371.085, "coord_origin": "TOPLEFT"}, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.112, "r_y0": 379.892, "r_x1": 254.879, "r_y1": 379.892, "r_x2": 254.879, "r_y2": 371.095, "r_x3": 252.112, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.764, "r_y0": 379.892, "r_x1": 480.592, "r_y1": 379.892, "r_x2": 480.592, "r_y2": 371.095, "r_x3": 258.764, "r_y3": 371.095, "coord_origin": "TOPLEFT"}, "text": "The upper neighbour of a \"U\" cell must be either", "orig": "The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 391.847, "r_x1": 284.839, "r_y1": 391.847, "r_x2": 284.839, "r_y2": 383.05, "r_x3": 151.701, "r_y3": 383.05, "coord_origin": "TOPLEFT"}, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Up-looking cell rule : The upper neighbour of a \"U\" cell must be either another \"U\" cell or a \"C\" cell."}, {"label": "section_header", "id": 14, "page_no": 6, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 138.973, "t": 394.998, "r": 226.074, "b": 403.805, "coord_origin": "TOPLEFT"}, "confidence": 0.6506174206733704, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 403.805, "r_x1": 146.72, "r_y1": 403.805, "r_x2": 146.72, "r_y2": 395.008, "r_x3": 138.973, "r_y3": 395.008, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 403.805, "r_x1": 223.304, "r_y1": 403.805, "r_x2": 223.304, "r_y2": 394.998, "r_x3": 151.701, "r_y3": 394.998, "coord_origin": "TOPLEFT"}, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 223.307, "r_y0": 403.805, "r_x1": 226.074, "r_y1": 403.805, "r_x2": 226.074, "r_y2": 395.008, "r_x3": 223.307, "r_y3": 395.008, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Cross cell rule :"}, {"label": "list_item", "id": 13, "page_no": 6, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 151.701, "t": 406.967, "r": 480.592, "b": 439.674, "coord_origin": "TOPLEFT"}, "confidence": 0.7247239947319031, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 415.764, "r_x1": 480.592, "r_y1": 415.764, "r_x2": 480.592, "r_y2": 406.967, "r_x3": 151.701, "r_y3": 406.967, "coord_origin": "TOPLEFT"}, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 427.719, "r_x1": 480.592, "r_y1": 427.719, "r_x2": 480.592, "r_y2": 418.922, "r_x3": 151.701, "r_y3": 418.922, "coord_origin": "TOPLEFT"}, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 439.674, "r_x1": 214.397, "r_y1": 439.674, "r_x2": 214.397, "r_y2": 430.877, "r_x3": 151.701, "r_y3": 430.877, "coord_origin": "TOPLEFT"}, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\" cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell or an \"L\" cell."}, {"label": "list_item", "id": 8, "page_no": 6, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 138.973, "t": 442.826, "r": 474.59, "b": 451.633, "coord_origin": "TOPLEFT"}, "confidence": 0.9259927272796631, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 451.633, "r_x1": 146.72, "r_y1": 451.633, "r_x2": 146.72, "r_y2": 442.836, "r_x3": 138.973, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 451.633, "r_x1": 221.323, "r_y1": 451.633, "r_x2": 221.323, "r_y2": 442.826, "r_x3": 151.701, "r_y3": 442.826, "coord_origin": "TOPLEFT"}, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.327, "r_y0": 451.633, "r_x1": 224.094, "r_y1": 451.633, "r_x2": 224.094, "r_y2": 442.836, "r_x3": 221.327, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.411, "r_y0": 451.633, "r_x1": 474.59, "r_y1": 451.633, "r_x2": 474.59, "r_y2": 442.836, "r_x3": 227.411, "r_y3": 442.836, "coord_origin": "TOPLEFT"}, "text": "Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": "Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. First row rule : Only \"L\" cells and \"C\" cells are allowed in the first row."}, {"label": "list_item", "id": 5, "page_no": 6, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 138.973, "t": 454.784, "r": 480.588, "b": 475.546, "coord_origin": "TOPLEFT"}, "confidence": 0.9420599937438965, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 463.591, "r_x1": 146.72, "r_y1": 463.591, "r_x2": 146.72, "r_y2": 454.794, "r_x3": 138.973, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 463.591, "r_x1": 240.72, "r_y1": 463.591, "r_x2": 240.72, "r_y2": 454.784, "r_x3": 151.701, "r_y3": 454.784, "coord_origin": "TOPLEFT"}, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.716, "r_y0": 463.591, "r_x1": 243.483, "r_y1": 463.591, "r_x2": 243.483, "r_y2": 454.794, "r_x3": 240.716, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.458, "r_y0": 463.591, "r_x1": 480.588, "r_y1": 463.591, "r_x2": 480.588, "r_y2": 454.794, "r_x3": 247.458, "r_y3": 454.794, "coord_origin": "TOPLEFT"}, "text": "Only \"U\" cells and \"C\" cells are allowed in the first", "orig": "Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 475.546, "r_x1": 186.007, "r_y1": 475.546, "r_x2": 186.007, "r_y2": 466.749, "r_x3": 151.701, "r_y3": 466.749, "coord_origin": "TOPLEFT"}, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. First column rule : Only \"U\" cells and \"C\" cells are allowed in the first column."}, {"label": "list_item", "id": 1, "page_no": 6, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 138.973, "t": 478.697, "r": 480.595, "b": 499.46, "coord_origin": "TOPLEFT"}, "confidence": 0.9617829918861389, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.973, "r_y0": 487.504, "r_x1": 146.72, "r_y1": 487.504, "r_x2": 146.72, "r_y2": 478.707, "r_x3": 138.973, "r_y3": 478.707, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 487.504, "r_x1": 235.158, "r_y1": 487.504, "r_x2": 235.158, "r_y2": 478.697, "r_x3": 151.701, "r_y3": 478.697, "coord_origin": "TOPLEFT"}, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.157, "r_y0": 487.504, "r_x1": 480.595, "r_y1": 487.504, "r_x2": 480.595, "r_y2": 478.707, "r_x3": 235.157, "r_y3": 478.707, "coord_origin": "TOPLEFT"}, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.701, "r_y0": 499.46, "r_x1": 448.042, "r_y1": 499.46, "r_x2": 448.042, "r_y2": 490.663, "r_x3": 151.701, "r_y3": 490.663, "coord_origin": "TOPLEFT"}, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Rectangular rule : The table representation is always rectangular - all rows must have an equal number of tokens, terminated with \"NL\" token."}, {"label": "text", "id": 0, "page_no": 6, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 512.5930000000001, "r": 480.596, "b": 640.942, "coord_origin": "TOPLEFT"}, "confidence": 0.9785562753677368, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 521.39, "r_x1": 480.596, "r_y1": 521.39, "r_x2": 480.596, "r_y2": 512.5930000000001, "r_x3": 149.709, "r_y3": 512.5930000000001, "coord_origin": "TOPLEFT"}, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.345, "r_x1": 480.591, "r_y1": 533.345, "r_x2": 480.591, "r_y2": 524.548, "r_x3": 134.765, "r_y3": 524.548, "coord_origin": "TOPLEFT"}, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.3, "r_x1": 480.595, "r_y1": 545.3, "r_x2": 480.595, "r_y2": 536.5029999999999, "r_x3": 134.765, "r_y3": 536.5029999999999, "coord_origin": "TOPLEFT"}, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.256, "r_x1": 480.589, "r_y1": 557.256, "r_x2": 480.589, "r_y2": 548.4590000000001, "r_x3": 134.765, "r_y3": 548.4590000000001, "coord_origin": "TOPLEFT"}, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.211, "r_x1": 480.594, "r_y1": 569.211, "r_x2": 480.594, "r_y2": 560.414, "r_x3": 134.765, "r_y3": 560.414, "coord_origin": "TOPLEFT"}, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.1659999999999, "r_x1": 480.587, "r_y1": 581.1659999999999, "r_x2": 480.587, "r_y2": 572.369, "r_x3": 134.765, "r_y3": 572.369, "coord_origin": "TOPLEFT"}, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.121, "r_x1": 480.592, "r_y1": 593.121, "r_x2": 480.592, "r_y2": 584.3240000000001, "r_x3": 134.765, "r_y3": 584.3240000000001, "coord_origin": "TOPLEFT"}, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.076, "r_x1": 480.592, "r_y1": 605.076, "r_x2": 480.592, "r_y2": 596.279, "r_x3": 134.765, "r_y3": 596.279, "coord_origin": "TOPLEFT"}, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.032, "r_x1": 480.594, "r_y1": 617.032, "r_x2": 480.594, "r_y2": 608.235, "r_x3": 134.765, "r_y3": 608.235, "coord_origin": "TOPLEFT"}, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 628.987, "r_x1": 480.591, "r_y1": 628.987, "r_x2": 480.591, "r_y2": 620.19, "r_x3": 134.765, "r_y3": 620.19, "coord_origin": "TOPLEFT"}, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.942, "r_x1": 311.198, "r_y1": 640.942, "r_x2": 311.198, "r_y2": 632.145, "r_x3": 134.765, "r_y3": 632.145, "coord_origin": "TOPLEFT"}, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The application of these rules gives OTSL a set of unique properties. First of all, the OTSL enforces a strictly rectangular structure representation, where every new-line token starts a new row. As a consequence, all rows and all columns have exactly the same number of tokens, irrespective of cell spans. Secondly, the OTSL representation is unambiguous: Every table structure is represented in one way. In this representation every table cell corresponds to a \"C\"-cell token, which in case of spans is always located in the top-left corner of the table cell definition. Third, OTSL syntax rules are only backward-looking. As a consequence, every predicted token can be validated straight during sequence generation by looking at the previously predicted sequence. As such, OTSL can guarantee that every predicted sequence is syntactically valid."}, {"label": "text", "id": 2, "page_no": 6, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 644.1030000000001, "r": 480.593, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9590610861778259, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 149.709, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 480.593, "r_y1": 664.855, "r_x2": 480.593, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "These characteristics can be easily learned by sequence generator networks, as we demonstrate further below. We find strong indications that this pattern"}], "headers": [{"label": "page_header", "id": 7, "page_no": 6, "cluster": {"id": 7, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.932651162147522, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 11, "page_no": 6, "cluster": {"id": 11, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8749732375144958, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7"}]}}, {"page_no": 7, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.589, "r_y1": 127.731, "r_x2": 480.589, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 163.564, "r_y1": 139.68600000000004, "r_x2": 163.564, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 170.36400000000003, "r_x1": 149.402, "r_y1": 170.36400000000003, "r_x2": 149.402, "r_y2": 161.55700000000002, "r_x3": 134.765, "r_y3": 161.55700000000002, "coord_origin": "TOPLEFT"}, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 170.36400000000003, "r_x1": 319.347, "r_y1": 170.36400000000003, "r_x2": 319.347, "r_y2": 161.55700000000002, "r_x3": 160.859, "r_y3": 161.55700000000002, "coord_origin": "TOPLEFT"}, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 191.07899999999995, "r_x1": 480.596, "r_y1": 191.07899999999995, "r_x2": 480.596, "r_y2": 182.28200000000004, "r_x3": 134.765, "r_y3": 182.28200000000004, "coord_origin": "TOPLEFT"}, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 203.03499999999997, "r_x1": 480.595, "r_y1": 203.03499999999997, "r_x2": 480.595, "r_y2": 194.23800000000006, "r_x3": 134.765, "r_y3": 194.23800000000006, "coord_origin": "TOPLEFT"}, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 214.99, "r_x1": 480.587, "r_y1": 214.99, "r_x2": 480.587, "r_y2": 206.19299999999998, "r_x3": 134.765, "r_y3": 206.19299999999998, "coord_origin": "TOPLEFT"}, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 226.94500000000005, "r_x1": 480.592, "r_y1": 226.94500000000005, "r_x2": 480.592, "r_y2": 218.14800000000002, "r_x3": 134.765, "r_y3": 218.14800000000002, "coord_origin": "TOPLEFT"}, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 238.89999999999998, "r_x1": 480.588, "r_y1": 238.89999999999998, "r_x2": 480.588, "r_y2": 230.10299999999995, "r_x3": 134.765, "r_y3": 230.10299999999995, "coord_origin": "TOPLEFT"}, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 250.85500000000002, "r_x1": 480.587, "r_y1": 250.85500000000002, "r_x2": 480.587, "r_y2": 242.058, "r_x3": 134.765, "r_y3": 242.058, "coord_origin": "TOPLEFT"}, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 262.80999999999995, "r_x1": 480.594, "r_y1": 262.80999999999995, "r_x2": 480.594, "r_y2": 254.01300000000003, "r_x3": 134.765, "r_y3": 254.01300000000003, "coord_origin": "TOPLEFT"}, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 274.76599999999996, "r_x1": 480.591, "r_y1": 274.76599999999996, "r_x2": 480.591, "r_y2": 265.96900000000005, "r_x3": 134.765, "r_y3": 265.96900000000005, "coord_origin": "TOPLEFT"}, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 286.721, "r_x1": 480.596, "r_y1": 286.721, "r_x2": 480.596, "r_y2": 277.924, "r_x3": 134.765, "r_y3": 277.924, "coord_origin": "TOPLEFT"}, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 298.676, "r_x1": 469.404, "r_y1": 298.676, "r_x2": 469.404, "r_y2": 289.879, "r_x3": 134.765, "r_y3": 289.879, "coord_origin": "TOPLEFT"}, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.732, "r_x1": 141.489, "r_y1": 331.732, "r_x2": 141.489, "r_y2": 321.164, "r_x3": 134.765, "r_y3": 321.164, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 331.732, "r_x1": 229.035, "r_y1": 331.732, "r_x2": 229.035, "r_y2": 321.164, "r_x3": 154.938, "r_y3": 321.164, "coord_origin": "TOPLEFT"}, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 356.047, "r_x1": 480.594, "r_y1": 356.047, "r_x2": 480.594, "r_y2": 347.25, "r_x3": 134.765, "r_y3": 347.25, "coord_origin": "TOPLEFT"}, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 368.002, "r_x1": 480.595, "r_y1": 368.002, "r_x2": 480.595, "r_y2": 359.205, "r_x3": 134.765, "r_y3": 359.205, "coord_origin": "TOPLEFT"}, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.957, "r_x1": 480.588, "r_y1": 379.957, "r_x2": 480.588, "r_y2": 371.16, "r_x3": 134.765, "r_y3": 371.16, "coord_origin": "TOPLEFT"}, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.912, "r_x1": 480.588, "r_y1": 391.912, "r_x2": 480.588, "r_y2": 383.115, "r_x3": 134.765, "r_y3": 383.115, "coord_origin": "TOPLEFT"}, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 403.867, "r_x1": 148.598, "r_y1": 403.867, "r_x2": 148.598, "r_y2": 395.07, "r_x3": 134.765, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.627, "r_y0": 403.867, "r_x1": 191.847, "r_y1": 403.867, "r_x2": 191.847, "r_y2": 395.07, "r_x3": 151.627, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.902, "r_y0": 403.867, "r_x1": 480.595, "r_y1": 403.867, "r_x2": 480.595, "r_y2": 395.07, "r_x3": 195.902, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 415.822, "r_x1": 172.59, "r_y1": 415.822, "r_x2": 172.59, "r_y2": 407.025, "r_x3": 134.765, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "found in", "orig": "found in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.492, "r_y0": 415.822, "r_x1": 191.325, "r_y1": 415.822, "r_x2": 191.325, "r_y2": 407.025, "r_x3": 177.492, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.226, "r_y0": 415.822, "r_x1": 213.463, "r_y1": 415.822, "r_x2": 213.463, "r_y2": 407.025, "r_x3": 196.226, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "first", "orig": "first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.364, "r_y0": 415.822, "r_x1": 236.125, "r_y1": 415.822, "r_x2": 236.125, "r_y2": 407.025, "r_x3": 218.364, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "step", "orig": "step", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.027, "r_y0": 415.822, "r_x1": 297.661, "r_y1": 415.822, "r_x2": 297.661, "r_y2": 407.025, "r_x3": 241.027, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "and evaluate", "orig": "and evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.563, "r_y0": 415.822, "r_x1": 480.593, "r_y1": 415.822, "r_x2": 480.593, "r_y2": 407.025, "r_x3": 302.563, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "how OTSL impacts the performance of", "orig": "how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 427.778, "r_x1": 377.321, "r_y1": 427.778, "r_x2": 377.321, "r_y2": 418.981, "r_x3": 134.765, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "TableFormer after training on other publicly available", "orig": "TableFormer after training on other publicly available", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.874, "r_y0": 427.778, "r_x1": 421.951, "r_y1": 427.778, "r_x2": 421.951, "r_y2": 418.981, "r_x3": 381.874, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "data sets", "orig": "data sets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.504, "r_y0": 427.778, "r_x1": 480.595, "r_y1": 427.778, "r_x2": 480.595, "r_y2": 418.981, "r_x3": 426.504, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "(FinTabNet,", "orig": "(FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.733, "r_x1": 480.592, "r_y1": 439.733, "r_x2": 480.592, "r_y2": 430.936, "r_x3": 134.765, "r_y3": 430.936, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 451.688, "r_x1": 479.303, "r_y1": 451.688, "r_x2": 479.303, "r_y2": 442.891, "r_x3": 134.765, "r_y3": 442.891, "coord_origin": "TOPLEFT"}, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 492.574, "r_x1": 162.644, "r_y1": 492.574, "r_x2": 162.644, "r_y2": 484.648, "r_x3": 134.765, "r_y3": 484.648, "coord_origin": "TOPLEFT"}, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.196, "r_y0": 493.722, "r_x1": 480.591, "r_y1": 493.722, "r_x2": 480.591, "r_y2": 482.433, "r_x3": 165.196, "r_y3": 482.433, "coord_origin": "TOPLEFT"}, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 504.681, "r_x1": 206.702, "r_y1": 504.681, "r_x2": 206.702, "r_y2": 493.392, "r_x3": 134.765, "r_y3": 493.392, "coord_origin": "TOPLEFT"}, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 543.091, "r_x1": 149.407, "r_y1": 543.091, "r_x2": 149.407, "r_y2": 540.762, "r_x3": 147.3, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 543.091, "r_x1": 155.721, "r_y1": 543.091, "r_x2": 155.721, "r_y2": 540.762, "r_x3": 150.809, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 162.76, "r_y0": 537.754, "r_x1": 172.296, "r_y1": 537.754, "r_x2": 172.296, "r_y2": 535.424, "r_x3": 162.76, "r_y3": 535.424, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.636, "r_y0": 537.726, "r_x1": 155.918, "r_y1": 537.726, "r_x2": 155.918, "r_y2": 535.396, "r_x3": 147.636, "r_y3": 535.396, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 543.091, "r_x1": 164.102, "r_y1": 543.091, "r_x2": 164.102, "r_y2": 540.762, "r_x3": 158.485, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 547.03, "r_x1": 162.697, "r_y1": 547.03, "r_x2": 162.697, "r_y2": 544.701, "r_x3": 158.485, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 551.2719999999999, "r_x1": 164.102, "r_y1": 551.2719999999999, "r_x2": 164.102, "r_y2": 548.943, "r_x3": 158.485, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 555.514, "r_x1": 162.697, "r_y1": 555.514, "r_x2": 162.697, "r_y2": 553.185, "r_x3": 158.485, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 543.091, "r_x1": 172.889, "r_y1": 543.091, "r_x2": 172.889, "r_y2": 540.762, "r_x3": 168.817, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 547.03, "r_x1": 172.889, "r_y1": 547.03, "r_x2": 172.889, "r_y2": 544.701, "r_x3": 168.817, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 551.2719999999999, "r_x1": 172.889, "r_y1": 551.2719999999999, "r_x2": 172.889, "r_y2": 548.943, "r_x3": 168.817, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 555.514, "r_x1": 172.889, "r_y1": 555.514, "r_x2": 172.889, "r_y2": 553.185, "r_x3": 168.817, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 547.03, "r_x1": 149.407, "r_y1": 547.03, "r_x2": 149.407, "r_y2": 544.701, "r_x3": 147.3, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 547.03, "r_x1": 155.721, "r_y1": 547.03, "r_x2": 155.721, "r_y2": 544.701, "r_x3": 150.809, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 551.2719999999999, "r_x1": 149.407, "r_y1": 551.2719999999999, "r_x2": 149.407, "r_y2": 548.943, "r_x3": 147.3, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 551.2719999999999, "r_x1": 155.721, "r_y1": 551.2719999999999, "r_x2": 155.721, "r_y2": 548.943, "r_x3": 150.809, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 555.514, "r_x1": 149.407, "r_y1": 555.514, "r_x2": 149.407, "r_y2": 553.185, "r_x3": 147.3, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 555.514, "r_x1": 155.721, "r_y1": 555.514, "r_x2": 155.721, "r_y2": 553.185, "r_x3": 150.809, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.05, "r_y0": 521.2570000000001, "r_x1": 171.249, "r_y1": 521.2570000000001, "r_x2": 171.249, "r_y2": 517.0640000000001, "r_x3": 152.05, "r_y3": 517.0640000000001, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.133, "r_y0": 526.56, "r_x1": 175.168, "r_y1": 526.56, "r_x2": 175.168, "r_y2": 522.367, "r_x3": 148.133, "r_y3": 522.367, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.533, "r_y0": 528.762, "r_x1": 220.32, "r_y1": 528.762, "r_x2": 220.32, "r_y2": 524.569, "r_x3": 193.533, "r_y3": 524.569, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.473, "r_y0": 534.0640000000001, "r_x1": 214.379, "r_y1": 534.0640000000001, "r_x2": 214.379, "r_y2": 529.871, "r_x3": 199.473, "r_y3": 529.871, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.611, "r_y0": 514.153, "r_x1": 284.473, "r_y1": 514.153, "r_x2": 284.473, "r_y2": 509.96, "r_x3": 273.611, "r_y3": 509.96, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 517.94, "r_x1": 287.632, "r_y1": 517.94, "r_x2": 287.632, "r_y2": 513.7470000000001, "r_x3": 270.452, "r_y3": 513.7470000000001, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.478, "r_y0": 512.392, "r_x1": 348.14, "r_y1": 512.392, "r_x2": 348.14, "r_y2": 508.199, "r_x3": 332.478, "r_y3": 508.199, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.686, "r_y0": 525.3679999999999, "r_x1": 407.255, "r_y1": 525.3679999999999, "r_x2": 407.255, "r_y2": 521.175, "r_x3": 376.686, "r_y3": 521.175, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.909, "r_y0": 529.913, "r_x1": 410.035, "r_y1": 529.913, "r_x2": 410.035, "r_y2": 525.72, "r_x3": 373.909, "r_y3": 525.72, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.299, "r_y0": 534.4580000000001, "r_x1": 408.649, "r_y1": 534.4580000000001, "r_x2": 408.649, "r_y2": 530.265, "r_x3": 375.299, "r_y3": 530.265, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.067, "r_y0": 539.0029999999999, "r_x1": 406.883, "r_y1": 539.0029999999999, "r_x2": 406.883, "r_y2": 534.81, "r_x3": 377.067, "r_y3": 534.81, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.567, "r_y0": 567.489, "r_x1": 433.765, "r_y1": 567.489, "r_x2": 433.765, "r_y2": 563.296, "r_x3": 383.567, "r_y3": 563.296, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.528, "r_y0": 572.034, "r_x1": 433.808, "r_y1": 572.034, "r_x2": 433.808, "r_y2": 567.841, "r_x3": 383.528, "r_y3": 567.841, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.475, "r_y0": 576.579, "r_x1": 426.857, "r_y1": 576.579, "r_x2": 426.857, "r_y2": 572.386, "r_x3": 390.475, "r_y3": 572.386, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 582.139, "r_x1": 323.169, "r_y1": 582.139, "r_x2": 323.169, "r_y2": 577.946, "r_x3": 293.947, "r_y3": 577.946, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 586.684, "r_x1": 324.594, "r_y1": 586.684, "r_x2": 324.594, "r_y2": 582.491, "r_x3": 293.947, "r_y3": 582.491, "coord_origin": "TOPLEFT"}, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 546.0699999999999, "r_x1": 364.147, "r_y1": 546.0699999999999, "r_x2": 364.147, "r_y2": 541.877, "r_x3": 333.078, "r_y3": 541.877, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 549.858, "r_x1": 369.715, "r_y1": 549.858, "r_x2": 369.715, "r_y2": 545.665, "r_x3": 333.078, "r_y3": 545.665, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.659, "r_y0": 519.489, "r_x1": 249.589, "r_y1": 519.489, "r_x2": 249.589, "r_y2": 515.296, "r_x3": 232.659, "r_y3": 515.296, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.822, "r_y0": 550.218, "r_x1": 288.263, "r_y1": 550.218, "r_x2": 288.263, "r_y2": 546.0260000000001, "r_x3": 269.822, "r_y3": 546.0260000000001, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 554.006, "r_x1": 287.632, "r_y1": 554.006, "r_x2": 287.632, "r_y2": 549.813, "r_x3": 270.452, "r_y3": 549.813, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 520.1600000000001, "r_x1": 358.112, "r_y1": 520.1600000000001, "r_x2": 358.112, "r_y2": 515.967, "r_x3": 332.177, "r_y3": 515.967, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 526.22, "r_x1": 361.583, "r_y1": 526.22, "r_x2": 361.583, "r_y2": 522.027, "r_x3": 332.177, "r_y3": 522.027, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 532.28, "r_x1": 364.765, "r_y1": 532.28, "r_x2": 364.765, "r_y2": 528.087, "r_x3": 332.177, "r_y3": 528.087, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 538.34, "r_x1": 335.965, "r_y1": 538.34, "r_x2": 335.965, "r_y2": 534.1469999999999, "r_x3": 332.177, "r_y3": 534.1469999999999, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.889, "r_y0": 520.643, "r_x1": 329.416, "r_y1": 520.643, "r_x2": 329.416, "r_y2": 516.45, "r_x3": 326.889, "r_y3": 516.45, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 526.672, "r_x1": 329.568, "r_y1": 526.672, "r_x2": 329.568, "r_y2": 522.479, "r_x3": 327.041, "r_y3": 522.479, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 532.7629999999999, "r_x1": 329.568, "r_y1": 532.7629999999999, "r_x2": 329.568, "r_y2": 528.5699999999999, "r_x3": 327.041, "r_y3": 528.5699999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.141, "r_y0": 531.69, "r_x1": 426.668, "r_y1": 531.69, "r_x2": 426.668, "r_y2": 527.4970000000001, "r_x3": 424.141, "r_y3": 527.4970000000001, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.002, "r_y0": 521.701, "r_x1": 455.529, "r_y1": 521.701, "r_x2": 455.529, "r_y2": 517.508, "r_x3": 453.002, "r_y3": 517.508, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.858, "r_y0": 521.31, "r_x1": 426.385, "r_y1": 521.31, "r_x2": 426.385, "r_y2": 517.117, "r_x3": 423.858, "r_y3": 517.117, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.434, "r_y0": 562.3389999999999, "r_x1": 359.834, "r_y1": 561.855, "r_x2": 359.834, "r_y2": 556.947, "r_x3": 333.434, "r_y3": 557.431, "coord_origin": "TOPLEFT"}, "text": "C C L NL", "orig": "C C L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.31, "r_y0": 568.837, "r_x1": 359.986, "r_y1": 568.552, "r_x2": 359.986, "r_y2": 563.644, "r_x3": 340.31, "r_y3": 563.929, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.596, "r_y0": 568.795, "r_x1": 337.437, "r_y1": 568.795, "r_x2": 337.437, "r_y2": 563.887, "r_x3": 333.596, "r_y3": 563.887, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.375, "r_y0": 575.399, "r_x1": 359.999, "r_y1": 575.134, "r_x2": 359.999, "r_y2": 570.226, "r_x3": 340.375, "r_y3": 570.491, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.661, "r_y0": 575.356, "r_x1": 337.503, "r_y1": 575.356, "r_x2": 337.503, "r_y2": 570.448, "r_x3": 333.661, "r_y3": 570.448, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.377, "r_y0": 581.998, "r_x1": 359.954, "r_y1": 581.738, "r_x2": 359.954, "r_y2": 576.83, "r_x3": 340.377, "r_y3": 577.09, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.663, "r_y0": 581.955, "r_x1": 337.504, "r_y1": 581.955, "r_x2": 337.504, "r_y2": 577.047, "r_x3": 333.663, "r_y3": 577.047, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.279, "r_y0": 588.369, "r_x1": 360.07, "r_y1": 588.3779999999999, "r_x2": 360.07, "r_y2": 583.47, "r_x3": 340.279, "r_y3": 583.461, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.566, "r_y0": 588.327, "r_x1": 337.407, "r_y1": 588.327, "r_x2": 337.407, "r_y2": 583.419, "r_x3": 333.566, "r_y3": 583.419, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.14, "r_y0": 568.538, "r_x1": 333.667, "r_y1": 568.538, "r_x2": 333.667, "r_y2": 564.345, "r_x3": 331.14, "r_y3": 564.345, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.81, "r_y0": 558.841, "r_x1": 343.337, "r_y1": 558.841, "r_x2": 343.337, "r_y2": 554.648, "r_x3": 340.81, "r_y3": 554.648, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.98, "r_y0": 559.078, "r_x1": 333.507, "r_y1": 559.078, "r_x2": 333.507, "r_y2": 554.885, "r_x3": 330.98, "r_y3": 554.885, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 628.99, "r_x1": 480.588, "r_y1": 628.99, "r_x2": 480.588, "r_y2": 620.193, "r_x3": 149.709, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 155.846, "r_y1": 664.855, "r_x2": 155.846, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.442, "r_y0": 664.855, "r_x1": 480.59, "r_y1": 664.855, "r_x2": 480.59, "r_y2": 656.058, "r_x3": 159.442, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "The predicted OTSL structures were converted back to HTML format in", "orig": "The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 9, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8301323056221008, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8631826043128967, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.589, "b": 139.68600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9464744925498962, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.589, "r_y1": 127.731, "r_x2": 480.589, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 163.564, "r_y1": 139.68600000000004, "r_x2": 163.564, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "section_header", "bbox": {"l": 134.765, "t": 161.55700000000002, "r": 319.347, "b": 170.36400000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9549514651298523, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 170.36400000000003, "r_x1": 149.402, "r_y1": 170.36400000000003, "r_x2": 149.402, "r_y2": 161.55700000000002, "r_x3": 134.765, "r_y3": 161.55700000000002, "coord_origin": "TOPLEFT"}, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 170.36400000000003, "r_x1": 319.347, "r_y1": 170.36400000000003, "r_x2": 319.347, "r_y2": 161.55700000000002, "r_x3": 160.859, "r_y3": 161.55700000000002, "coord_origin": "TOPLEFT"}, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 182.28200000000004, "r": 480.596, "b": 298.676, "coord_origin": "TOPLEFT"}, "confidence": 0.9879790544509888, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 191.07899999999995, "r_x1": 480.596, "r_y1": 191.07899999999995, "r_x2": 480.596, "r_y2": 182.28200000000004, "r_x3": 134.765, "r_y3": 182.28200000000004, "coord_origin": "TOPLEFT"}, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 203.03499999999997, "r_x1": 480.595, "r_y1": 203.03499999999997, "r_x2": 480.595, "r_y2": 194.23800000000006, "r_x3": 134.765, "r_y3": 194.23800000000006, "coord_origin": "TOPLEFT"}, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 214.99, "r_x1": 480.587, "r_y1": 214.99, "r_x2": 480.587, "r_y2": 206.19299999999998, "r_x3": 134.765, "r_y3": 206.19299999999998, "coord_origin": "TOPLEFT"}, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 226.94500000000005, "r_x1": 480.592, "r_y1": 226.94500000000005, "r_x2": 480.592, "r_y2": 218.14800000000002, "r_x3": 134.765, "r_y3": 218.14800000000002, "coord_origin": "TOPLEFT"}, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 238.89999999999998, "r_x1": 480.588, "r_y1": 238.89999999999998, "r_x2": 480.588, "r_y2": 230.10299999999995, "r_x3": 134.765, "r_y3": 230.10299999999995, "coord_origin": "TOPLEFT"}, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 250.85500000000002, "r_x1": 480.587, "r_y1": 250.85500000000002, "r_x2": 480.587, "r_y2": 242.058, "r_x3": 134.765, "r_y3": 242.058, "coord_origin": "TOPLEFT"}, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 262.80999999999995, "r_x1": 480.594, "r_y1": 262.80999999999995, "r_x2": 480.594, "r_y2": 254.01300000000003, "r_x3": 134.765, "r_y3": 254.01300000000003, "coord_origin": "TOPLEFT"}, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 274.76599999999996, "r_x1": 480.591, "r_y1": 274.76599999999996, "r_x2": 480.591, "r_y2": 265.96900000000005, "r_x3": 134.765, "r_y3": 265.96900000000005, "coord_origin": "TOPLEFT"}, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 286.721, "r_x1": 480.596, "r_y1": 286.721, "r_x2": 480.596, "r_y2": 277.924, "r_x3": 134.765, "r_y3": 277.924, "coord_origin": "TOPLEFT"}, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 298.676, "r_x1": 469.404, "r_y1": 298.676, "r_x2": 469.404, "r_y2": 289.879, "r_x3": 134.765, "r_y3": 289.879, "coord_origin": "TOPLEFT"}, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 321.164, "r": 229.035, "b": 331.732, "coord_origin": "TOPLEFT"}, "confidence": 0.95152747631073, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.732, "r_x1": 141.489, "r_y1": 331.732, "r_x2": 141.489, "r_y2": 321.164, "r_x3": 134.765, "r_y3": 321.164, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 331.732, "r_x1": 229.035, "r_y1": 331.732, "r_x2": 229.035, "r_y2": 321.164, "r_x3": 154.938, "r_y3": 321.164, "coord_origin": "TOPLEFT"}, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 347.25, "r": 480.595, "b": 451.688, "coord_origin": "TOPLEFT"}, "confidence": 0.9877985119819641, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 356.047, "r_x1": 480.594, "r_y1": 356.047, "r_x2": 480.594, "r_y2": 347.25, "r_x3": 134.765, "r_y3": 347.25, "coord_origin": "TOPLEFT"}, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 368.002, "r_x1": 480.595, "r_y1": 368.002, "r_x2": 480.595, "r_y2": 359.205, "r_x3": 134.765, "r_y3": 359.205, "coord_origin": "TOPLEFT"}, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.957, "r_x1": 480.588, "r_y1": 379.957, "r_x2": 480.588, "r_y2": 371.16, "r_x3": 134.765, "r_y3": 371.16, "coord_origin": "TOPLEFT"}, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.912, "r_x1": 480.588, "r_y1": 391.912, "r_x2": 480.588, "r_y2": 383.115, "r_x3": 134.765, "r_y3": 383.115, "coord_origin": "TOPLEFT"}, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 403.867, "r_x1": 148.598, "r_y1": 403.867, "r_x2": 148.598, "r_y2": 395.07, "r_x3": 134.765, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.627, "r_y0": 403.867, "r_x1": 191.847, "r_y1": 403.867, "r_x2": 191.847, "r_y2": 395.07, "r_x3": 151.627, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.902, "r_y0": 403.867, "r_x1": 480.595, "r_y1": 403.867, "r_x2": 480.595, "r_y2": 395.07, "r_x3": 195.902, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 415.822, "r_x1": 172.59, "r_y1": 415.822, "r_x2": 172.59, "r_y2": 407.025, "r_x3": 134.765, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "found in", "orig": "found in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.492, "r_y0": 415.822, "r_x1": 191.325, "r_y1": 415.822, "r_x2": 191.325, "r_y2": 407.025, "r_x3": 177.492, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.226, "r_y0": 415.822, "r_x1": 213.463, "r_y1": 415.822, "r_x2": 213.463, "r_y2": 407.025, "r_x3": 196.226, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "first", "orig": "first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.364, "r_y0": 415.822, "r_x1": 236.125, "r_y1": 415.822, "r_x2": 236.125, "r_y2": 407.025, "r_x3": 218.364, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "step", "orig": "step", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.027, "r_y0": 415.822, "r_x1": 297.661, "r_y1": 415.822, "r_x2": 297.661, "r_y2": 407.025, "r_x3": 241.027, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "and evaluate", "orig": "and evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.563, "r_y0": 415.822, "r_x1": 480.593, "r_y1": 415.822, "r_x2": 480.593, "r_y2": 407.025, "r_x3": 302.563, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "how OTSL impacts the performance of", "orig": "how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 427.778, "r_x1": 377.321, "r_y1": 427.778, "r_x2": 377.321, "r_y2": 418.981, "r_x3": 134.765, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "TableFormer after training on other publicly available", "orig": "TableFormer after training on other publicly available", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.874, "r_y0": 427.778, "r_x1": 421.951, "r_y1": 427.778, "r_x2": 421.951, "r_y2": 418.981, "r_x3": 381.874, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "data sets", "orig": "data sets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.504, "r_y0": 427.778, "r_x1": 480.595, "r_y1": 427.778, "r_x2": 480.595, "r_y2": 418.981, "r_x3": 426.504, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "(FinTabNet,", "orig": "(FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.733, "r_x1": 480.592, "r_y1": 439.733, "r_x2": 480.592, "r_y2": 430.936, "r_x3": 134.765, "r_y3": 430.936, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 451.688, "r_x1": 479.303, "r_y1": 451.688, "r_x2": 479.303, "r_y2": 442.891, "r_x3": 134.765, "r_y3": 442.891, "coord_origin": "TOPLEFT"}, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "caption", "bbox": {"l": 134.765, "t": 482.433, "r": 480.591, "b": 504.681, "coord_origin": "TOPLEFT"}, "confidence": 0.9297956228256226, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 492.574, "r_x1": 162.644, "r_y1": 492.574, "r_x2": 162.644, "r_y2": 484.648, "r_x3": 134.765, "r_y3": 484.648, "coord_origin": "TOPLEFT"}, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.196, "r_y0": 493.722, "r_x1": 480.591, "r_y1": 493.722, "r_x2": 480.591, "r_y2": 482.433, "r_x3": 165.196, "r_y3": 482.433, "coord_origin": "TOPLEFT"}, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 504.681, "r_x1": 206.702, "r_y1": 504.681, "r_x2": 206.702, "r_y2": 493.392, "r_x3": 134.765, "r_y3": 493.392, "coord_origin": "TOPLEFT"}, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "picture", "bbox": {"l": 140.70968627929688, "t": 508.0638427734375, "r": 472.73382568359375, "b": 593.6771850585938, "coord_origin": "TOPLEFT"}, "confidence": 0.9303396344184875, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 543.091, "r_x1": 149.407, "r_y1": 543.091, "r_x2": 149.407, "r_y2": 540.762, "r_x3": 147.3, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 543.091, "r_x1": 155.721, "r_y1": 543.091, "r_x2": 155.721, "r_y2": 540.762, "r_x3": 150.809, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 162.76, "r_y0": 537.754, "r_x1": 172.296, "r_y1": 537.754, "r_x2": 172.296, "r_y2": 535.424, "r_x3": 162.76, "r_y3": 535.424, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.636, "r_y0": 537.726, "r_x1": 155.918, "r_y1": 537.726, "r_x2": 155.918, "r_y2": 535.396, "r_x3": 147.636, "r_y3": 535.396, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 543.091, "r_x1": 164.102, "r_y1": 543.091, "r_x2": 164.102, "r_y2": 540.762, "r_x3": 158.485, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 547.03, "r_x1": 162.697, "r_y1": 547.03, "r_x2": 162.697, "r_y2": 544.701, "r_x3": 158.485, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 551.2719999999999, "r_x1": 164.102, "r_y1": 551.2719999999999, "r_x2": 164.102, "r_y2": 548.943, "r_x3": 158.485, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 555.514, "r_x1": 162.697, "r_y1": 555.514, "r_x2": 162.697, "r_y2": 553.185, "r_x3": 158.485, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 543.091, "r_x1": 172.889, "r_y1": 543.091, "r_x2": 172.889, "r_y2": 540.762, "r_x3": 168.817, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 547.03, "r_x1": 172.889, "r_y1": 547.03, "r_x2": 172.889, "r_y2": 544.701, "r_x3": 168.817, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 551.2719999999999, "r_x1": 172.889, "r_y1": 551.2719999999999, "r_x2": 172.889, "r_y2": 548.943, "r_x3": 168.817, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 555.514, "r_x1": 172.889, "r_y1": 555.514, "r_x2": 172.889, "r_y2": 553.185, "r_x3": 168.817, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 547.03, "r_x1": 149.407, "r_y1": 547.03, "r_x2": 149.407, "r_y2": 544.701, "r_x3": 147.3, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 547.03, "r_x1": 155.721, "r_y1": 547.03, "r_x2": 155.721, "r_y2": 544.701, "r_x3": 150.809, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 551.2719999999999, "r_x1": 149.407, "r_y1": 551.2719999999999, "r_x2": 149.407, "r_y2": 548.943, "r_x3": 147.3, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 551.2719999999999, "r_x1": 155.721, "r_y1": 551.2719999999999, "r_x2": 155.721, "r_y2": 548.943, "r_x3": 150.809, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 555.514, "r_x1": 149.407, "r_y1": 555.514, "r_x2": 149.407, "r_y2": 553.185, "r_x3": 147.3, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 555.514, "r_x1": 155.721, "r_y1": 555.514, "r_x2": 155.721, "r_y2": 553.185, "r_x3": 150.809, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.05, "r_y0": 521.2570000000001, "r_x1": 171.249, "r_y1": 521.2570000000001, "r_x2": 171.249, "r_y2": 517.0640000000001, "r_x3": 152.05, "r_y3": 517.0640000000001, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.133, "r_y0": 526.56, "r_x1": 175.168, "r_y1": 526.56, "r_x2": 175.168, "r_y2": 522.367, "r_x3": 148.133, "r_y3": 522.367, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.533, "r_y0": 528.762, "r_x1": 220.32, "r_y1": 528.762, "r_x2": 220.32, "r_y2": 524.569, "r_x3": 193.533, "r_y3": 524.569, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.473, "r_y0": 534.0640000000001, "r_x1": 214.379, "r_y1": 534.0640000000001, "r_x2": 214.379, "r_y2": 529.871, "r_x3": 199.473, "r_y3": 529.871, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.611, "r_y0": 514.153, "r_x1": 284.473, "r_y1": 514.153, "r_x2": 284.473, "r_y2": 509.96, "r_x3": 273.611, "r_y3": 509.96, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 517.94, "r_x1": 287.632, "r_y1": 517.94, "r_x2": 287.632, "r_y2": 513.7470000000001, "r_x3": 270.452, "r_y3": 513.7470000000001, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.478, "r_y0": 512.392, "r_x1": 348.14, "r_y1": 512.392, "r_x2": 348.14, "r_y2": 508.199, "r_x3": 332.478, "r_y3": 508.199, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.686, "r_y0": 525.3679999999999, "r_x1": 407.255, "r_y1": 525.3679999999999, "r_x2": 407.255, "r_y2": 521.175, "r_x3": 376.686, "r_y3": 521.175, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.909, "r_y0": 529.913, "r_x1": 410.035, "r_y1": 529.913, "r_x2": 410.035, "r_y2": 525.72, "r_x3": 373.909, "r_y3": 525.72, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.299, "r_y0": 534.4580000000001, "r_x1": 408.649, "r_y1": 534.4580000000001, "r_x2": 408.649, "r_y2": 530.265, "r_x3": 375.299, "r_y3": 530.265, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.067, "r_y0": 539.0029999999999, "r_x1": 406.883, "r_y1": 539.0029999999999, "r_x2": 406.883, "r_y2": 534.81, "r_x3": 377.067, "r_y3": 534.81, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.567, "r_y0": 567.489, "r_x1": 433.765, "r_y1": 567.489, "r_x2": 433.765, "r_y2": 563.296, "r_x3": 383.567, "r_y3": 563.296, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.528, "r_y0": 572.034, "r_x1": 433.808, "r_y1": 572.034, "r_x2": 433.808, "r_y2": 567.841, "r_x3": 383.528, "r_y3": 567.841, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.475, "r_y0": 576.579, "r_x1": 426.857, "r_y1": 576.579, "r_x2": 426.857, "r_y2": 572.386, "r_x3": 390.475, "r_y3": 572.386, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 582.139, "r_x1": 323.169, "r_y1": 582.139, "r_x2": 323.169, "r_y2": 577.946, "r_x3": 293.947, "r_y3": 577.946, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 586.684, "r_x1": 324.594, "r_y1": 586.684, "r_x2": 324.594, "r_y2": 582.491, "r_x3": 293.947, "r_y3": 582.491, "coord_origin": "TOPLEFT"}, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 546.0699999999999, "r_x1": 364.147, "r_y1": 546.0699999999999, "r_x2": 364.147, "r_y2": 541.877, "r_x3": 333.078, "r_y3": 541.877, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 549.858, "r_x1": 369.715, "r_y1": 549.858, "r_x2": 369.715, "r_y2": 545.665, "r_x3": 333.078, "r_y3": 545.665, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.659, "r_y0": 519.489, "r_x1": 249.589, "r_y1": 519.489, "r_x2": 249.589, "r_y2": 515.296, "r_x3": 232.659, "r_y3": 515.296, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.822, "r_y0": 550.218, "r_x1": 288.263, "r_y1": 550.218, "r_x2": 288.263, "r_y2": 546.0260000000001, "r_x3": 269.822, "r_y3": 546.0260000000001, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 554.006, "r_x1": 287.632, "r_y1": 554.006, "r_x2": 287.632, "r_y2": 549.813, "r_x3": 270.452, "r_y3": 549.813, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 520.1600000000001, "r_x1": 358.112, "r_y1": 520.1600000000001, "r_x2": 358.112, "r_y2": 515.967, "r_x3": 332.177, "r_y3": 515.967, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 526.22, "r_x1": 361.583, "r_y1": 526.22, "r_x2": 361.583, "r_y2": 522.027, "r_x3": 332.177, "r_y3": 522.027, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 532.28, "r_x1": 364.765, "r_y1": 532.28, "r_x2": 364.765, "r_y2": 528.087, "r_x3": 332.177, "r_y3": 528.087, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 538.34, "r_x1": 335.965, "r_y1": 538.34, "r_x2": 335.965, "r_y2": 534.1469999999999, "r_x3": 332.177, "r_y3": 534.1469999999999, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.889, "r_y0": 520.643, "r_x1": 329.416, "r_y1": 520.643, "r_x2": 329.416, "r_y2": 516.45, "r_x3": 326.889, "r_y3": 516.45, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 526.672, "r_x1": 329.568, "r_y1": 526.672, "r_x2": 329.568, "r_y2": 522.479, "r_x3": 327.041, "r_y3": 522.479, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 532.7629999999999, "r_x1": 329.568, "r_y1": 532.7629999999999, "r_x2": 329.568, "r_y2": 528.5699999999999, "r_x3": 327.041, "r_y3": 528.5699999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.141, "r_y0": 531.69, "r_x1": 426.668, "r_y1": 531.69, "r_x2": 426.668, "r_y2": 527.4970000000001, "r_x3": 424.141, "r_y3": 527.4970000000001, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.002, "r_y0": 521.701, "r_x1": 455.529, "r_y1": 521.701, "r_x2": 455.529, "r_y2": 517.508, "r_x3": 453.002, "r_y3": 517.508, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.858, "r_y0": 521.31, "r_x1": 426.385, "r_y1": 521.31, "r_x2": 426.385, "r_y2": 517.117, "r_x3": 423.858, "r_y3": 517.117, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.434, "r_y0": 562.3389999999999, "r_x1": 359.834, "r_y1": 561.855, "r_x2": 359.834, "r_y2": 556.947, "r_x3": 333.434, "r_y3": 557.431, "coord_origin": "TOPLEFT"}, "text": "C C L NL", "orig": "C C L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.31, "r_y0": 568.837, "r_x1": 359.986, "r_y1": 568.552, "r_x2": 359.986, "r_y2": 563.644, "r_x3": 340.31, "r_y3": 563.929, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.596, "r_y0": 568.795, "r_x1": 337.437, "r_y1": 568.795, "r_x2": 337.437, "r_y2": 563.887, "r_x3": 333.596, "r_y3": 563.887, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.375, "r_y0": 575.399, "r_x1": 359.999, "r_y1": 575.134, "r_x2": 359.999, "r_y2": 570.226, "r_x3": 340.375, "r_y3": 570.491, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.661, "r_y0": 575.356, "r_x1": 337.503, "r_y1": 575.356, "r_x2": 337.503, "r_y2": 570.448, "r_x3": 333.661, "r_y3": 570.448, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.377, "r_y0": 581.998, "r_x1": 359.954, "r_y1": 581.738, "r_x2": 359.954, "r_y2": 576.83, "r_x3": 340.377, "r_y3": 577.09, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.663, "r_y0": 581.955, "r_x1": 337.504, "r_y1": 581.955, "r_x2": 337.504, "r_y2": 577.047, "r_x3": 333.663, "r_y3": 577.047, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.279, "r_y0": 588.369, "r_x1": 360.07, "r_y1": 588.3779999999999, "r_x2": 360.07, "r_y2": 583.47, "r_x3": 340.279, "r_y3": 583.461, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.566, "r_y0": 588.327, "r_x1": 337.407, "r_y1": 588.327, "r_x2": 337.407, "r_y2": 583.419, "r_x3": 333.566, "r_y3": 583.419, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.14, "r_y0": 568.538, "r_x1": 333.667, "r_y1": 568.538, "r_x2": 333.667, "r_y2": 564.345, "r_x3": 331.14, "r_y3": 564.345, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.81, "r_y0": 558.841, "r_x1": 343.337, "r_y1": 558.841, "r_x2": 343.337, "r_y2": 554.648, "r_x3": 340.81, "r_y3": 554.648, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.98, "r_y0": 559.078, "r_x1": 333.507, "r_y1": 559.078, "r_x2": 333.507, "r_y2": 554.885, "r_x3": 330.98, "r_y3": 554.885, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 13, "label": "text", "bbox": {"l": 147.3, "t": 540.762, "r": 149.407, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 543.091, "r_x1": 149.407, "r_y1": 543.091, "r_x2": 149.407, "r_y2": 540.762, "r_x3": 147.3, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 150.809, "t": 540.762, "r": 155.721, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 543.091, "r_x1": 155.721, "r_y1": 543.091, "r_x2": 155.721, "r_y2": 540.762, "r_x3": 150.809, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 162.76, "t": 535.424, "r": 172.296, "b": 537.754, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 162.76, "r_y0": 537.754, "r_x1": 172.296, "r_y1": 537.754, "r_x2": 172.296, "r_y2": 535.424, "r_x3": 162.76, "r_y3": 535.424, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 147.636, "t": 535.396, "r": 155.918, "b": 537.726, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.636, "r_y0": 537.726, "r_x1": 155.918, "r_y1": 537.726, "r_x2": 155.918, "r_y2": 535.396, "r_x3": 147.636, "r_y3": 535.396, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 158.485, "t": 540.762, "r": 164.102, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 543.091, "r_x1": 164.102, "r_y1": 543.091, "r_x2": 164.102, "r_y2": 540.762, "r_x3": 158.485, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 158.485, "t": 544.701, "r": 162.697, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 547.03, "r_x1": 162.697, "r_y1": 547.03, "r_x2": 162.697, "r_y2": 544.701, "r_x3": 158.485, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 158.485, "t": 548.943, "r": 164.102, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 551.2719999999999, "r_x1": 164.102, "r_y1": 551.2719999999999, "r_x2": 164.102, "r_y2": 548.943, "r_x3": 158.485, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 158.485, "t": 553.185, "r": 162.697, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 555.514, "r_x1": 162.697, "r_y1": 555.514, "r_x2": 162.697, "r_y2": 553.185, "r_x3": 158.485, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 168.817, "t": 540.762, "r": 172.889, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 543.091, "r_x1": 172.889, "r_y1": 543.091, "r_x2": 172.889, "r_y2": 540.762, "r_x3": 168.817, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 168.817, "t": 544.701, "r": 172.889, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 547.03, "r_x1": 172.889, "r_y1": 547.03, "r_x2": 172.889, "r_y2": 544.701, "r_x3": 168.817, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 168.817, "t": 548.943, "r": 172.889, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 551.2719999999999, "r_x1": 172.889, "r_y1": 551.2719999999999, "r_x2": 172.889, "r_y2": 548.943, "r_x3": 168.817, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 168.817, "t": 553.185, "r": 172.889, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 555.514, "r_x1": 172.889, "r_y1": 555.514, "r_x2": 172.889, "r_y2": 553.185, "r_x3": 168.817, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 147.3, "t": 544.701, "r": 149.407, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 547.03, "r_x1": 149.407, "r_y1": 547.03, "r_x2": 149.407, "r_y2": 544.701, "r_x3": 147.3, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 150.809, "t": 544.701, "r": 155.721, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 547.03, "r_x1": 155.721, "r_y1": 547.03, "r_x2": 155.721, "r_y2": 544.701, "r_x3": 150.809, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 147.3, "t": 548.943, "r": 149.407, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 551.2719999999999, "r_x1": 149.407, "r_y1": 551.2719999999999, "r_x2": 149.407, "r_y2": 548.943, "r_x3": 147.3, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 150.809, "t": 548.943, "r": 155.721, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 551.2719999999999, "r_x1": 155.721, "r_y1": 551.2719999999999, "r_x2": 155.721, "r_y2": 548.943, "r_x3": 150.809, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 147.3, "t": 553.185, "r": 149.407, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 555.514, "r_x1": 149.407, "r_y1": 555.514, "r_x2": 149.407, "r_y2": 553.185, "r_x3": 147.3, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 150.809, "t": 553.185, "r": 155.721, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 555.514, "r_x1": 155.721, "r_y1": 555.514, "r_x2": 155.721, "r_y2": 553.185, "r_x3": 150.809, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 152.05, "t": 517.0640000000001, "r": 171.249, "b": 521.2570000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.05, "r_y0": 521.2570000000001, "r_x1": 171.249, "r_y1": 521.2570000000001, "r_x2": 171.249, "r_y2": 517.0640000000001, "r_x3": 152.05, "r_y3": 517.0640000000001, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 148.133, "t": 522.367, "r": 175.168, "b": 526.56, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.133, "r_y0": 526.56, "r_x1": 175.168, "r_y1": 526.56, "r_x2": 175.168, "r_y2": 522.367, "r_x3": 148.133, "r_y3": 522.367, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 193.533, "t": 524.569, "r": 220.32, "b": 528.762, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.533, "r_y0": 528.762, "r_x1": 220.32, "r_y1": 528.762, "r_x2": 220.32, "r_y2": 524.569, "r_x3": 193.533, "r_y3": 524.569, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 199.473, "t": 529.871, "r": 214.379, "b": 534.0640000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.473, "r_y0": 534.0640000000001, "r_x1": 214.379, "r_y1": 534.0640000000001, "r_x2": 214.379, "r_y2": 529.871, "r_x3": 199.473, "r_y3": 529.871, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 273.611, "t": 509.96, "r": 284.473, "b": 514.153, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.611, "r_y0": 514.153, "r_x1": 284.473, "r_y1": 514.153, "r_x2": 284.473, "r_y2": 509.96, "r_x3": 273.611, "r_y3": 509.96, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 270.452, "t": 513.7470000000001, "r": 287.632, "b": 517.94, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 517.94, "r_x1": 287.632, "r_y1": 517.94, "r_x2": 287.632, "r_y2": 513.7470000000001, "r_x3": 270.452, "r_y3": 513.7470000000001, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 332.478, "t": 508.199, "r": 348.14, "b": 512.392, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.478, "r_y0": 512.392, "r_x1": 348.14, "r_y1": 512.392, "r_x2": 348.14, "r_y2": 508.199, "r_x3": 332.478, "r_y3": 508.199, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 376.686, "t": 521.175, "r": 407.255, "b": 525.3679999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.686, "r_y0": 525.3679999999999, "r_x1": 407.255, "r_y1": 525.3679999999999, "r_x2": 407.255, "r_y2": 521.175, "r_x3": 376.686, "r_y3": 521.175, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 373.909, "t": 525.72, "r": 410.035, "b": 529.913, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.909, "r_y0": 529.913, "r_x1": 410.035, "r_y1": 529.913, "r_x2": 410.035, "r_y2": 525.72, "r_x3": 373.909, "r_y3": 525.72, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 375.299, "t": 530.265, "r": 408.649, "b": 534.4580000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.299, "r_y0": 534.4580000000001, "r_x1": 408.649, "r_y1": 534.4580000000001, "r_x2": 408.649, "r_y2": 530.265, "r_x3": 375.299, "r_y3": 530.265, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 377.067, "t": 534.81, "r": 406.883, "b": 539.0029999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.067, "r_y0": 539.0029999999999, "r_x1": 406.883, "r_y1": 539.0029999999999, "r_x2": 406.883, "r_y2": 534.81, "r_x3": 377.067, "r_y3": 534.81, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 383.567, "t": 563.296, "r": 433.765, "b": 567.489, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.567, "r_y0": 567.489, "r_x1": 433.765, "r_y1": 567.489, "r_x2": 433.765, "r_y2": 563.296, "r_x3": 383.567, "r_y3": 563.296, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 383.528, "t": 567.841, "r": 433.808, "b": 572.034, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.528, "r_y0": 572.034, "r_x1": 433.808, "r_y1": 572.034, "r_x2": 433.808, "r_y2": 567.841, "r_x3": 383.528, "r_y3": 567.841, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 390.475, "t": 572.386, "r": 426.857, "b": 576.579, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.475, "r_y0": 576.579, "r_x1": 426.857, "r_y1": 576.579, "r_x2": 426.857, "r_y2": 572.386, "r_x3": 390.475, "r_y3": 572.386, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 293.947, "t": 577.946, "r": 323.169, "b": 582.139, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 582.139, "r_x1": 323.169, "r_y1": 582.139, "r_x2": 323.169, "r_y2": 577.946, "r_x3": 293.947, "r_y3": 577.946, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 293.947, "t": 582.491, "r": 324.594, "b": 586.684, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 586.684, "r_x1": 324.594, "r_y1": 586.684, "r_x2": 324.594, "r_y2": 582.491, "r_x3": 293.947, "r_y3": 582.491, "coord_origin": "TOPLEFT"}, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 333.078, "t": 541.877, "r": 364.147, "b": 546.0699999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 546.0699999999999, "r_x1": 364.147, "r_y1": 546.0699999999999, "r_x2": 364.147, "r_y2": 541.877, "r_x3": 333.078, "r_y3": 541.877, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 333.078, "t": 545.665, "r": 369.715, "b": 549.858, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 549.858, "r_x1": 369.715, "r_y1": 549.858, "r_x2": 369.715, "r_y2": 545.665, "r_x3": 333.078, "r_y3": 545.665, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 232.659, "t": 515.296, "r": 249.589, "b": 519.489, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.659, "r_y0": 519.489, "r_x1": 249.589, "r_y1": 519.489, "r_x2": 249.589, "r_y2": 515.296, "r_x3": 232.659, "r_y3": 515.296, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 269.822, "t": 546.0260000000001, "r": 288.263, "b": 550.218, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.822, "r_y0": 550.218, "r_x1": 288.263, "r_y1": 550.218, "r_x2": 288.263, "r_y2": 546.0260000000001, "r_x3": 269.822, "r_y3": 546.0260000000001, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 270.452, "t": 549.813, "r": 287.632, "b": 554.006, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 554.006, "r_x1": 287.632, "r_y1": 554.006, "r_x2": 287.632, "r_y2": 549.813, "r_x3": 270.452, "r_y3": 549.813, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 332.177, "t": 515.967, "r": 358.112, "b": 520.1600000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 520.1600000000001, "r_x1": 358.112, "r_y1": 520.1600000000001, "r_x2": 358.112, "r_y2": 515.967, "r_x3": 332.177, "r_y3": 515.967, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 332.177, "t": 522.027, "r": 361.583, "b": 526.22, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 526.22, "r_x1": 361.583, "r_y1": 526.22, "r_x2": 361.583, "r_y2": 522.027, "r_x3": 332.177, "r_y3": 522.027, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 332.177, "t": 528.087, "r": 364.765, "b": 532.28, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 532.28, "r_x1": 364.765, "r_y1": 532.28, "r_x2": 364.765, "r_y2": 528.087, "r_x3": 332.177, "r_y3": 528.087, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 332.177, "t": 534.1469999999999, "r": 335.965, "b": 538.34, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 538.34, "r_x1": 335.965, "r_y1": 538.34, "r_x2": 335.965, "r_y2": 534.1469999999999, "r_x3": 332.177, "r_y3": 534.1469999999999, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 326.889, "t": 516.45, "r": 329.416, "b": 520.643, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.889, "r_y0": 520.643, "r_x1": 329.416, "r_y1": 520.643, "r_x2": 329.416, "r_y2": 516.45, "r_x3": 326.889, "r_y3": 516.45, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 327.041, "t": 522.479, "r": 329.568, "b": 526.672, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 526.672, "r_x1": 329.568, "r_y1": 526.672, "r_x2": 329.568, "r_y2": 522.479, "r_x3": 327.041, "r_y3": 522.479, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 327.041, "t": 528.5699999999999, "r": 329.568, "b": 532.7629999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 532.7629999999999, "r_x1": 329.568, "r_y1": 532.7629999999999, "r_x2": 329.568, "r_y2": 528.5699999999999, "r_x3": 327.041, "r_y3": 528.5699999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 424.141, "t": 527.4970000000001, "r": 426.668, "b": 531.69, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.141, "r_y0": 531.69, "r_x1": 426.668, "r_y1": 531.69, "r_x2": 426.668, "r_y2": 527.4970000000001, "r_x3": 424.141, "r_y3": 527.4970000000001, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 453.002, "t": 517.508, "r": 455.529, "b": 521.701, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.002, "r_y0": 521.701, "r_x1": 455.529, "r_y1": 521.701, "r_x2": 455.529, "r_y2": 517.508, "r_x3": 453.002, "r_y3": 517.508, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 423.858, "t": 517.117, "r": 426.385, "b": 521.31, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.858, "r_y0": 521.31, "r_x1": 426.385, "r_y1": 521.31, "r_x2": 426.385, "r_y2": 517.117, "r_x3": 423.858, "r_y3": 517.117, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 333.434, "t": 556.947, "r": 359.834, "b": 562.3389999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.434, "r_y0": 562.3389999999999, "r_x1": 359.834, "r_y1": 561.855, "r_x2": 359.834, "r_y2": 556.947, "r_x3": 333.434, "r_y3": 557.431, "coord_origin": "TOPLEFT"}, "text": "C C L NL", "orig": "C C L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 340.31, "t": 563.644, "r": 359.986, "b": 568.837, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.31, "r_y0": 568.837, "r_x1": 359.986, "r_y1": 568.552, "r_x2": 359.986, "r_y2": 563.644, "r_x3": 340.31, "r_y3": 563.929, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 333.596, "t": 563.887, "r": 337.437, "b": 568.795, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.596, "r_y0": 568.795, "r_x1": 337.437, "r_y1": 568.795, "r_x2": 337.437, "r_y2": 563.887, "r_x3": 333.596, "r_y3": 563.887, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 340.375, "t": 570.226, "r": 359.999, "b": 575.399, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.375, "r_y0": 575.399, "r_x1": 359.999, "r_y1": 575.134, "r_x2": 359.999, "r_y2": 570.226, "r_x3": 340.375, "r_y3": 570.491, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 333.661, "t": 570.448, "r": 337.503, "b": 575.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.661, "r_y0": 575.356, "r_x1": 337.503, "r_y1": 575.356, "r_x2": 337.503, "r_y2": 570.448, "r_x3": 333.661, "r_y3": 570.448, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 340.377, "t": 576.83, "r": 359.954, "b": 581.998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.377, "r_y0": 581.998, "r_x1": 359.954, "r_y1": 581.738, "r_x2": 359.954, "r_y2": 576.83, "r_x3": 340.377, "r_y3": 577.09, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 333.663, "t": 577.047, "r": 337.504, "b": 581.955, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.663, "r_y0": 581.955, "r_x1": 337.504, "r_y1": 581.955, "r_x2": 337.504, "r_y2": 577.047, "r_x3": 333.663, "r_y3": 577.047, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 340.279, "t": 583.461, "r": 360.07, "b": 588.3779999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.279, "r_y0": 588.369, "r_x1": 360.07, "r_y1": 588.3779999999999, "r_x2": 360.07, "r_y2": 583.47, "r_x3": 340.279, "r_y3": 583.461, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 333.566, "t": 583.419, "r": 337.407, "b": 588.327, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.566, "r_y0": 588.327, "r_x1": 337.407, "r_y1": 588.327, "r_x2": 337.407, "r_y2": 583.419, "r_x3": 333.566, "r_y3": 583.419, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 331.14, "t": 564.345, "r": 333.667, "b": 568.538, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.14, "r_y0": 568.538, "r_x1": 333.667, "r_y1": 568.538, "r_x2": 333.667, "r_y2": 564.345, "r_x3": 331.14, "r_y3": 564.345, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 340.81, "t": 554.648, "r": 343.337, "b": 558.841, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.81, "r_y0": 558.841, "r_x1": 343.337, "r_y1": 558.841, "r_x2": 343.337, "r_y2": 554.648, "r_x3": 340.81, "r_y3": 554.648, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 330.98, "t": 554.885, "r": 333.507, "b": 559.078, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.98, "r_y0": 559.078, "r_x1": 333.507, "r_y1": 559.078, "r_x2": 333.507, "r_y2": 554.885, "r_x3": 330.98, "r_y3": 554.885, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 620.193, "r": 480.592, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.951270341873169, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 628.99, "r_x1": 480.588, "r_y1": 628.99, "r_x2": 480.588, "r_y2": 620.193, "r_x3": 149.709, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 155.846, "r_y1": 664.855, "r_x2": 155.846, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.442, "r_y0": 664.855, "r_x1": 480.59, "r_y1": 664.855, "r_x2": 480.59, "r_y2": 656.058, "r_x3": 159.442, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "The predicted OTSL structures were converted back to HTML format in", "orig": "The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 9, "page_no": 7, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8301323056221008, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8"}, {"label": "page_header", "id": 8, "page_no": 7, "cluster": {"id": 8, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8631826043128967, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}, {"label": "text", "id": 5, "page_no": 7, "cluster": {"id": 5, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.589, "b": 139.68600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9464744925498962, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.589, "r_y1": 127.731, "r_x2": 480.589, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 163.564, "r_y1": 139.68600000000004, "r_x2": 163.564, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "reduces significantly the column drift seen in the HTML based models (see Figure 5)."}, {"label": "section_header", "id": 2, "page_no": 7, "cluster": {"id": 2, "label": "section_header", "bbox": {"l": 134.765, "t": 161.55700000000002, "r": 319.347, "b": 170.36400000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9549514651298523, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 170.36400000000003, "r_x1": 149.402, "r_y1": 170.36400000000003, "r_x2": 149.402, "r_y2": 161.55700000000002, "r_x3": 134.765, "r_y3": 161.55700000000002, "coord_origin": "TOPLEFT"}, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 170.36400000000003, "r_x1": 319.347, "r_y1": 170.36400000000003, "r_x2": 319.347, "r_y2": 161.55700000000002, "r_x3": 160.859, "r_y3": 161.55700000000002, "coord_origin": "TOPLEFT"}, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.3 Error-detection and -mitigation"}, {"label": "text", "id": 0, "page_no": 7, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 182.28200000000004, "r": 480.596, "b": 298.676, "coord_origin": "TOPLEFT"}, "confidence": 0.9879790544509888, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 191.07899999999995, "r_x1": 480.596, "r_y1": 191.07899999999995, "r_x2": 480.596, "r_y2": 182.28200000000004, "r_x3": 134.765, "r_y3": 182.28200000000004, "coord_origin": "TOPLEFT"}, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 203.03499999999997, "r_x1": 480.595, "r_y1": 203.03499999999997, "r_x2": 480.595, "r_y2": 194.23800000000006, "r_x3": 134.765, "r_y3": 194.23800000000006, "coord_origin": "TOPLEFT"}, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 214.99, "r_x1": 480.587, "r_y1": 214.99, "r_x2": 480.587, "r_y2": 206.19299999999998, "r_x3": 134.765, "r_y3": 206.19299999999998, "coord_origin": "TOPLEFT"}, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 226.94500000000005, "r_x1": 480.592, "r_y1": 226.94500000000005, "r_x2": 480.592, "r_y2": 218.14800000000002, "r_x3": 134.765, "r_y3": 218.14800000000002, "coord_origin": "TOPLEFT"}, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 238.89999999999998, "r_x1": 480.588, "r_y1": 238.89999999999998, "r_x2": 480.588, "r_y2": 230.10299999999995, "r_x3": 134.765, "r_y3": 230.10299999999995, "coord_origin": "TOPLEFT"}, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 250.85500000000002, "r_x1": 480.587, "r_y1": 250.85500000000002, "r_x2": 480.587, "r_y2": 242.058, "r_x3": 134.765, "r_y3": 242.058, "coord_origin": "TOPLEFT"}, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 262.80999999999995, "r_x1": 480.594, "r_y1": 262.80999999999995, "r_x2": 480.594, "r_y2": 254.01300000000003, "r_x3": 134.765, "r_y3": 254.01300000000003, "coord_origin": "TOPLEFT"}, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 274.76599999999996, "r_x1": 480.591, "r_y1": 274.76599999999996, "r_x2": 480.591, "r_y2": 265.96900000000005, "r_x3": 134.765, "r_y3": 265.96900000000005, "coord_origin": "TOPLEFT"}, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 286.721, "r_x1": 480.596, "r_y1": 286.721, "r_x2": 480.596, "r_y2": 277.924, "r_x3": 134.765, "r_y3": 277.924, "coord_origin": "TOPLEFT"}, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 298.676, "r_x1": 469.404, "r_y1": 298.676, "r_x2": 469.404, "r_y2": 289.879, "r_x3": 134.765, "r_y3": 289.879, "coord_origin": "TOPLEFT"}, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The design of OTSL allows to validate a table structure easily on an unfinished sequence. The detection of an invalid sequence token is a clear indication of a prediction mistake, however a valid sequence by itself does not guarantee prediction correctness. Different heuristics can be used to correct token errors in an invalid sequence and thus increase the chances for accurate predictions. Such heuristics can be applied either after the prediction of each token, or at the end on the entire predicted sequence. For example a simple heuristic which can correct the predicted OTSL sequence on-the-fly is to verify if the token with the highest prediction confidence invalidates the predicted sequence, and replace it by the token with the next highest confidence until OTSL rules are satisfied."}, {"label": "section_header", "id": 3, "page_no": 7, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 321.164, "r": 229.035, "b": 331.732, "coord_origin": "TOPLEFT"}, "confidence": 0.95152747631073, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.732, "r_x1": 141.489, "r_y1": 331.732, "r_x2": 141.489, "r_y2": 321.164, "r_x3": 134.765, "r_y3": 321.164, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 331.732, "r_x1": 229.035, "r_y1": 331.732, "r_x2": 229.035, "r_y2": 321.164, "r_x3": 154.938, "r_y3": 321.164, "coord_origin": "TOPLEFT"}, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5 Experiments"}, {"label": "text", "id": 1, "page_no": 7, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 347.25, "r": 480.595, "b": 451.688, "coord_origin": "TOPLEFT"}, "confidence": 0.9877985119819641, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 356.047, "r_x1": 480.594, "r_y1": 356.047, "r_x2": 480.594, "r_y2": 347.25, "r_x3": 134.765, "r_y3": 347.25, "coord_origin": "TOPLEFT"}, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 368.002, "r_x1": 480.595, "r_y1": 368.002, "r_x2": 480.595, "r_y2": 359.205, "r_x3": 134.765, "r_y3": 359.205, "coord_origin": "TOPLEFT"}, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.957, "r_x1": 480.588, "r_y1": 379.957, "r_x2": 480.588, "r_y2": 371.16, "r_x3": 134.765, "r_y3": 371.16, "coord_origin": "TOPLEFT"}, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.912, "r_x1": 480.588, "r_y1": 391.912, "r_x2": 480.588, "r_y2": 383.115, "r_x3": 134.765, "r_y3": 383.115, "coord_origin": "TOPLEFT"}, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 403.867, "r_x1": 148.598, "r_y1": 403.867, "r_x2": 148.598, "r_y2": 395.07, "r_x3": 134.765, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.627, "r_y0": 403.867, "r_x1": 191.847, "r_y1": 403.867, "r_x2": 191.847, "r_y2": 395.07, "r_x3": 151.627, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.902, "r_y0": 403.867, "r_x1": 480.595, "r_y1": 403.867, "r_x2": 480.595, "r_y2": 395.07, "r_x3": 195.902, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 415.822, "r_x1": 172.59, "r_y1": 415.822, "r_x2": 172.59, "r_y2": 407.025, "r_x3": 134.765, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "found in", "orig": "found in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.492, "r_y0": 415.822, "r_x1": 191.325, "r_y1": 415.822, "r_x2": 191.325, "r_y2": 407.025, "r_x3": 177.492, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.226, "r_y0": 415.822, "r_x1": 213.463, "r_y1": 415.822, "r_x2": 213.463, "r_y2": 407.025, "r_x3": 196.226, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "first", "orig": "first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.364, "r_y0": 415.822, "r_x1": 236.125, "r_y1": 415.822, "r_x2": 236.125, "r_y2": 407.025, "r_x3": 218.364, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "step", "orig": "step", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.027, "r_y0": 415.822, "r_x1": 297.661, "r_y1": 415.822, "r_x2": 297.661, "r_y2": 407.025, "r_x3": 241.027, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "and evaluate", "orig": "and evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.563, "r_y0": 415.822, "r_x1": 480.593, "r_y1": 415.822, "r_x2": 480.593, "r_y2": 407.025, "r_x3": 302.563, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "how OTSL impacts the performance of", "orig": "how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 427.778, "r_x1": 377.321, "r_y1": 427.778, "r_x2": 377.321, "r_y2": 418.981, "r_x3": 134.765, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "TableFormer after training on other publicly available", "orig": "TableFormer after training on other publicly available", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.874, "r_y0": 427.778, "r_x1": 421.951, "r_y1": 427.778, "r_x2": 421.951, "r_y2": 418.981, "r_x3": 381.874, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "data sets", "orig": "data sets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.504, "r_y0": 427.778, "r_x1": 480.595, "r_y1": 427.778, "r_x2": 480.595, "r_y2": 418.981, "r_x3": 426.504, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "(FinTabNet,", "orig": "(FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.733, "r_x1": 480.592, "r_y1": 439.733, "r_x2": 480.592, "r_y2": 430.936, "r_x3": 134.765, "r_y3": 430.936, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 451.688, "r_x1": 479.303, "r_y1": 451.688, "r_x2": 479.303, "r_y2": 442.891, "r_x3": 134.765, "r_y3": 442.891, "coord_origin": "TOPLEFT"}, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we conducted a series of experiments based on the TableFormer model (Figure 4) with two objectives: Firstly we evaluate the prediction quality and performance of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on the canonical PubTabNet data set. Secondly we pick the best hyper-parameters found in the first step and evaluate how OTSL impacts the performance of TableFormer after training on other publicly available data sets (FinTabNet, PubTables-1M [14]). The ground truth (GT) from all data sets has been converted into OTSL format for this purpose, and will be made publicly available."}, {"label": "caption", "id": 7, "page_no": 7, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 134.765, "t": 482.433, "r": 480.591, "b": 504.681, "coord_origin": "TOPLEFT"}, "confidence": 0.9297956228256226, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 492.574, "r_x1": 162.644, "r_y1": 492.574, "r_x2": 162.644, "r_y2": 484.648, "r_x3": 134.765, "r_y3": 484.648, "coord_origin": "TOPLEFT"}, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.196, "r_y0": 493.722, "r_x1": 480.591, "r_y1": 493.722, "r_x2": 480.591, "r_y2": 482.433, "r_x3": 165.196, "r_y3": 482.433, "coord_origin": "TOPLEFT"}, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 504.681, "r_x1": 206.702, "r_y1": 504.681, "r_x2": 206.702, "r_y2": 493.392, "r_x3": 134.765, "r_y3": 493.392, "coord_origin": "TOPLEFT"}, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 4. Architecture sketch of the TableFormer model, which is a representative for the Im2Seq approach."}, {"label": "picture", "id": 6, "page_no": 7, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 140.70968627929688, "t": 508.0638427734375, "r": 472.73382568359375, "b": 593.6771850585938, "coord_origin": "TOPLEFT"}, "confidence": 0.9303396344184875, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 543.091, "r_x1": 149.407, "r_y1": 543.091, "r_x2": 149.407, "r_y2": 540.762, "r_x3": 147.3, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 543.091, "r_x1": 155.721, "r_y1": 543.091, "r_x2": 155.721, "r_y2": 540.762, "r_x3": 150.809, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 162.76, "r_y0": 537.754, "r_x1": 172.296, "r_y1": 537.754, "r_x2": 172.296, "r_y2": 535.424, "r_x3": 162.76, "r_y3": 535.424, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.636, "r_y0": 537.726, "r_x1": 155.918, "r_y1": 537.726, "r_x2": 155.918, "r_y2": 535.396, "r_x3": 147.636, "r_y3": 535.396, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 543.091, "r_x1": 164.102, "r_y1": 543.091, "r_x2": 164.102, "r_y2": 540.762, "r_x3": 158.485, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 547.03, "r_x1": 162.697, "r_y1": 547.03, "r_x2": 162.697, "r_y2": 544.701, "r_x3": 158.485, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 551.2719999999999, "r_x1": 164.102, "r_y1": 551.2719999999999, "r_x2": 164.102, "r_y2": 548.943, "r_x3": 158.485, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 555.514, "r_x1": 162.697, "r_y1": 555.514, "r_x2": 162.697, "r_y2": 553.185, "r_x3": 158.485, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 543.091, "r_x1": 172.889, "r_y1": 543.091, "r_x2": 172.889, "r_y2": 540.762, "r_x3": 168.817, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 547.03, "r_x1": 172.889, "r_y1": 547.03, "r_x2": 172.889, "r_y2": 544.701, "r_x3": 168.817, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 551.2719999999999, "r_x1": 172.889, "r_y1": 551.2719999999999, "r_x2": 172.889, "r_y2": 548.943, "r_x3": 168.817, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 555.514, "r_x1": 172.889, "r_y1": 555.514, "r_x2": 172.889, "r_y2": 553.185, "r_x3": 168.817, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 547.03, "r_x1": 149.407, "r_y1": 547.03, "r_x2": 149.407, "r_y2": 544.701, "r_x3": 147.3, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 547.03, "r_x1": 155.721, "r_y1": 547.03, "r_x2": 155.721, "r_y2": 544.701, "r_x3": 150.809, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 551.2719999999999, "r_x1": 149.407, "r_y1": 551.2719999999999, "r_x2": 149.407, "r_y2": 548.943, "r_x3": 147.3, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 551.2719999999999, "r_x1": 155.721, "r_y1": 551.2719999999999, "r_x2": 155.721, "r_y2": 548.943, "r_x3": 150.809, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 555.514, "r_x1": 149.407, "r_y1": 555.514, "r_x2": 149.407, "r_y2": 553.185, "r_x3": 147.3, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 555.514, "r_x1": 155.721, "r_y1": 555.514, "r_x2": 155.721, "r_y2": 553.185, "r_x3": 150.809, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.05, "r_y0": 521.2570000000001, "r_x1": 171.249, "r_y1": 521.2570000000001, "r_x2": 171.249, "r_y2": 517.0640000000001, "r_x3": 152.05, "r_y3": 517.0640000000001, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.133, "r_y0": 526.56, "r_x1": 175.168, "r_y1": 526.56, "r_x2": 175.168, "r_y2": 522.367, "r_x3": 148.133, "r_y3": 522.367, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.533, "r_y0": 528.762, "r_x1": 220.32, "r_y1": 528.762, "r_x2": 220.32, "r_y2": 524.569, "r_x3": 193.533, "r_y3": 524.569, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.473, "r_y0": 534.0640000000001, "r_x1": 214.379, "r_y1": 534.0640000000001, "r_x2": 214.379, "r_y2": 529.871, "r_x3": 199.473, "r_y3": 529.871, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.611, "r_y0": 514.153, "r_x1": 284.473, "r_y1": 514.153, "r_x2": 284.473, "r_y2": 509.96, "r_x3": 273.611, "r_y3": 509.96, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 517.94, "r_x1": 287.632, "r_y1": 517.94, "r_x2": 287.632, "r_y2": 513.7470000000001, "r_x3": 270.452, "r_y3": 513.7470000000001, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.478, "r_y0": 512.392, "r_x1": 348.14, "r_y1": 512.392, "r_x2": 348.14, "r_y2": 508.199, "r_x3": 332.478, "r_y3": 508.199, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.686, "r_y0": 525.3679999999999, "r_x1": 407.255, "r_y1": 525.3679999999999, "r_x2": 407.255, "r_y2": 521.175, "r_x3": 376.686, "r_y3": 521.175, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.909, "r_y0": 529.913, "r_x1": 410.035, "r_y1": 529.913, "r_x2": 410.035, "r_y2": 525.72, "r_x3": 373.909, "r_y3": 525.72, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.299, "r_y0": 534.4580000000001, "r_x1": 408.649, "r_y1": 534.4580000000001, "r_x2": 408.649, "r_y2": 530.265, "r_x3": 375.299, "r_y3": 530.265, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.067, "r_y0": 539.0029999999999, "r_x1": 406.883, "r_y1": 539.0029999999999, "r_x2": 406.883, "r_y2": 534.81, "r_x3": 377.067, "r_y3": 534.81, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.567, "r_y0": 567.489, "r_x1": 433.765, "r_y1": 567.489, "r_x2": 433.765, "r_y2": 563.296, "r_x3": 383.567, "r_y3": 563.296, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.528, "r_y0": 572.034, "r_x1": 433.808, "r_y1": 572.034, "r_x2": 433.808, "r_y2": 567.841, "r_x3": 383.528, "r_y3": 567.841, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.475, "r_y0": 576.579, "r_x1": 426.857, "r_y1": 576.579, "r_x2": 426.857, "r_y2": 572.386, "r_x3": 390.475, "r_y3": 572.386, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 582.139, "r_x1": 323.169, "r_y1": 582.139, "r_x2": 323.169, "r_y2": 577.946, "r_x3": 293.947, "r_y3": 577.946, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 586.684, "r_x1": 324.594, "r_y1": 586.684, "r_x2": 324.594, "r_y2": 582.491, "r_x3": 293.947, "r_y3": 582.491, "coord_origin": "TOPLEFT"}, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 546.0699999999999, "r_x1": 364.147, "r_y1": 546.0699999999999, "r_x2": 364.147, "r_y2": 541.877, "r_x3": 333.078, "r_y3": 541.877, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 549.858, "r_x1": 369.715, "r_y1": 549.858, "r_x2": 369.715, "r_y2": 545.665, "r_x3": 333.078, "r_y3": 545.665, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.659, "r_y0": 519.489, "r_x1": 249.589, "r_y1": 519.489, "r_x2": 249.589, "r_y2": 515.296, "r_x3": 232.659, "r_y3": 515.296, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.822, "r_y0": 550.218, "r_x1": 288.263, "r_y1": 550.218, "r_x2": 288.263, "r_y2": 546.0260000000001, "r_x3": 269.822, "r_y3": 546.0260000000001, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 554.006, "r_x1": 287.632, "r_y1": 554.006, "r_x2": 287.632, "r_y2": 549.813, "r_x3": 270.452, "r_y3": 549.813, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 520.1600000000001, "r_x1": 358.112, "r_y1": 520.1600000000001, "r_x2": 358.112, "r_y2": 515.967, "r_x3": 332.177, "r_y3": 515.967, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 526.22, "r_x1": 361.583, "r_y1": 526.22, "r_x2": 361.583, "r_y2": 522.027, "r_x3": 332.177, "r_y3": 522.027, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 532.28, "r_x1": 364.765, "r_y1": 532.28, "r_x2": 364.765, "r_y2": 528.087, "r_x3": 332.177, "r_y3": 528.087, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 538.34, "r_x1": 335.965, "r_y1": 538.34, "r_x2": 335.965, "r_y2": 534.1469999999999, "r_x3": 332.177, "r_y3": 534.1469999999999, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.889, "r_y0": 520.643, "r_x1": 329.416, "r_y1": 520.643, "r_x2": 329.416, "r_y2": 516.45, "r_x3": 326.889, "r_y3": 516.45, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 526.672, "r_x1": 329.568, "r_y1": 526.672, "r_x2": 329.568, "r_y2": 522.479, "r_x3": 327.041, "r_y3": 522.479, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 532.7629999999999, "r_x1": 329.568, "r_y1": 532.7629999999999, "r_x2": 329.568, "r_y2": 528.5699999999999, "r_x3": 327.041, "r_y3": 528.5699999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.141, "r_y0": 531.69, "r_x1": 426.668, "r_y1": 531.69, "r_x2": 426.668, "r_y2": 527.4970000000001, "r_x3": 424.141, "r_y3": 527.4970000000001, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.002, "r_y0": 521.701, "r_x1": 455.529, "r_y1": 521.701, "r_x2": 455.529, "r_y2": 517.508, "r_x3": 453.002, "r_y3": 517.508, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.858, "r_y0": 521.31, "r_x1": 426.385, "r_y1": 521.31, "r_x2": 426.385, "r_y2": 517.117, "r_x3": 423.858, "r_y3": 517.117, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.434, "r_y0": 562.3389999999999, "r_x1": 359.834, "r_y1": 561.855, "r_x2": 359.834, "r_y2": 556.947, "r_x3": 333.434, "r_y3": 557.431, "coord_origin": "TOPLEFT"}, "text": "C C L NL", "orig": "C C L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.31, "r_y0": 568.837, "r_x1": 359.986, "r_y1": 568.552, "r_x2": 359.986, "r_y2": 563.644, "r_x3": 340.31, "r_y3": 563.929, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.596, "r_y0": 568.795, "r_x1": 337.437, "r_y1": 568.795, "r_x2": 337.437, "r_y2": 563.887, "r_x3": 333.596, "r_y3": 563.887, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.375, "r_y0": 575.399, "r_x1": 359.999, "r_y1": 575.134, "r_x2": 359.999, "r_y2": 570.226, "r_x3": 340.375, "r_y3": 570.491, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.661, "r_y0": 575.356, "r_x1": 337.503, "r_y1": 575.356, "r_x2": 337.503, "r_y2": 570.448, "r_x3": 333.661, "r_y3": 570.448, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.377, "r_y0": 581.998, "r_x1": 359.954, "r_y1": 581.738, "r_x2": 359.954, "r_y2": 576.83, "r_x3": 340.377, "r_y3": 577.09, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.663, "r_y0": 581.955, "r_x1": 337.504, "r_y1": 581.955, "r_x2": 337.504, "r_y2": 577.047, "r_x3": 333.663, "r_y3": 577.047, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.279, "r_y0": 588.369, "r_x1": 360.07, "r_y1": 588.3779999999999, "r_x2": 360.07, "r_y2": 583.47, "r_x3": 340.279, "r_y3": 583.461, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.566, "r_y0": 588.327, "r_x1": 337.407, "r_y1": 588.327, "r_x2": 337.407, "r_y2": 583.419, "r_x3": 333.566, "r_y3": 583.419, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.14, "r_y0": 568.538, "r_x1": 333.667, "r_y1": 568.538, "r_x2": 333.667, "r_y2": 564.345, "r_x3": 331.14, "r_y3": 564.345, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.81, "r_y0": 558.841, "r_x1": 343.337, "r_y1": 558.841, "r_x2": 343.337, "r_y2": 554.648, "r_x3": 340.81, "r_y3": 554.648, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.98, "r_y0": 559.078, "r_x1": 333.507, "r_y1": 559.078, "r_x2": 333.507, "r_y2": 554.885, "r_x3": 330.98, "r_y3": 554.885, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 13, "label": "text", "bbox": {"l": 147.3, "t": 540.762, "r": 149.407, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 543.091, "r_x1": 149.407, "r_y1": 543.091, "r_x2": 149.407, "r_y2": 540.762, "r_x3": 147.3, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 150.809, "t": 540.762, "r": 155.721, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 543.091, "r_x1": 155.721, "r_y1": 543.091, "r_x2": 155.721, "r_y2": 540.762, "r_x3": 150.809, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 162.76, "t": 535.424, "r": 172.296, "b": 537.754, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 162.76, "r_y0": 537.754, "r_x1": 172.296, "r_y1": 537.754, "r_x2": 172.296, "r_y2": 535.424, "r_x3": 162.76, "r_y3": 535.424, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 147.636, "t": 535.396, "r": 155.918, "b": 537.726, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.636, "r_y0": 537.726, "r_x1": 155.918, "r_y1": 537.726, "r_x2": 155.918, "r_y2": 535.396, "r_x3": 147.636, "r_y3": 535.396, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 158.485, "t": 540.762, "r": 164.102, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 543.091, "r_x1": 164.102, "r_y1": 543.091, "r_x2": 164.102, "r_y2": 540.762, "r_x3": 158.485, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 158.485, "t": 544.701, "r": 162.697, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 547.03, "r_x1": 162.697, "r_y1": 547.03, "r_x2": 162.697, "r_y2": 544.701, "r_x3": 158.485, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 158.485, "t": 548.943, "r": 164.102, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 551.2719999999999, "r_x1": 164.102, "r_y1": 551.2719999999999, "r_x2": 164.102, "r_y2": 548.943, "r_x3": 158.485, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 158.485, "t": 553.185, "r": 162.697, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 555.514, "r_x1": 162.697, "r_y1": 555.514, "r_x2": 162.697, "r_y2": 553.185, "r_x3": 158.485, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 168.817, "t": 540.762, "r": 172.889, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 543.091, "r_x1": 172.889, "r_y1": 543.091, "r_x2": 172.889, "r_y2": 540.762, "r_x3": 168.817, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 168.817, "t": 544.701, "r": 172.889, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 547.03, "r_x1": 172.889, "r_y1": 547.03, "r_x2": 172.889, "r_y2": 544.701, "r_x3": 168.817, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 168.817, "t": 548.943, "r": 172.889, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 551.2719999999999, "r_x1": 172.889, "r_y1": 551.2719999999999, "r_x2": 172.889, "r_y2": 548.943, "r_x3": 168.817, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 168.817, "t": 553.185, "r": 172.889, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 555.514, "r_x1": 172.889, "r_y1": 555.514, "r_x2": 172.889, "r_y2": 553.185, "r_x3": 168.817, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 147.3, "t": 544.701, "r": 149.407, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 547.03, "r_x1": 149.407, "r_y1": 547.03, "r_x2": 149.407, "r_y2": 544.701, "r_x3": 147.3, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 150.809, "t": 544.701, "r": 155.721, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 547.03, "r_x1": 155.721, "r_y1": 547.03, "r_x2": 155.721, "r_y2": 544.701, "r_x3": 150.809, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 147.3, "t": 548.943, "r": 149.407, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 551.2719999999999, "r_x1": 149.407, "r_y1": 551.2719999999999, "r_x2": 149.407, "r_y2": 548.943, "r_x3": 147.3, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 150.809, "t": 548.943, "r": 155.721, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 551.2719999999999, "r_x1": 155.721, "r_y1": 551.2719999999999, "r_x2": 155.721, "r_y2": 548.943, "r_x3": 150.809, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 147.3, "t": 553.185, "r": 149.407, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 555.514, "r_x1": 149.407, "r_y1": 555.514, "r_x2": 149.407, "r_y2": 553.185, "r_x3": 147.3, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 150.809, "t": 553.185, "r": 155.721, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 555.514, "r_x1": 155.721, "r_y1": 555.514, "r_x2": 155.721, "r_y2": 553.185, "r_x3": 150.809, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 152.05, "t": 517.0640000000001, "r": 171.249, "b": 521.2570000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.05, "r_y0": 521.2570000000001, "r_x1": 171.249, "r_y1": 521.2570000000001, "r_x2": 171.249, "r_y2": 517.0640000000001, "r_x3": 152.05, "r_y3": 517.0640000000001, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 148.133, "t": 522.367, "r": 175.168, "b": 526.56, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.133, "r_y0": 526.56, "r_x1": 175.168, "r_y1": 526.56, "r_x2": 175.168, "r_y2": 522.367, "r_x3": 148.133, "r_y3": 522.367, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 193.533, "t": 524.569, "r": 220.32, "b": 528.762, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.533, "r_y0": 528.762, "r_x1": 220.32, "r_y1": 528.762, "r_x2": 220.32, "r_y2": 524.569, "r_x3": 193.533, "r_y3": 524.569, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 199.473, "t": 529.871, "r": 214.379, "b": 534.0640000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.473, "r_y0": 534.0640000000001, "r_x1": 214.379, "r_y1": 534.0640000000001, "r_x2": 214.379, "r_y2": 529.871, "r_x3": 199.473, "r_y3": 529.871, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 273.611, "t": 509.96, "r": 284.473, "b": 514.153, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.611, "r_y0": 514.153, "r_x1": 284.473, "r_y1": 514.153, "r_x2": 284.473, "r_y2": 509.96, "r_x3": 273.611, "r_y3": 509.96, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 270.452, "t": 513.7470000000001, "r": 287.632, "b": 517.94, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 517.94, "r_x1": 287.632, "r_y1": 517.94, "r_x2": 287.632, "r_y2": 513.7470000000001, "r_x3": 270.452, "r_y3": 513.7470000000001, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 332.478, "t": 508.199, "r": 348.14, "b": 512.392, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.478, "r_y0": 512.392, "r_x1": 348.14, "r_y1": 512.392, "r_x2": 348.14, "r_y2": 508.199, "r_x3": 332.478, "r_y3": 508.199, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 376.686, "t": 521.175, "r": 407.255, "b": 525.3679999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.686, "r_y0": 525.3679999999999, "r_x1": 407.255, "r_y1": 525.3679999999999, "r_x2": 407.255, "r_y2": 521.175, "r_x3": 376.686, "r_y3": 521.175, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 373.909, "t": 525.72, "r": 410.035, "b": 529.913, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.909, "r_y0": 529.913, "r_x1": 410.035, "r_y1": 529.913, "r_x2": 410.035, "r_y2": 525.72, "r_x3": 373.909, "r_y3": 525.72, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 375.299, "t": 530.265, "r": 408.649, "b": 534.4580000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.299, "r_y0": 534.4580000000001, "r_x1": 408.649, "r_y1": 534.4580000000001, "r_x2": 408.649, "r_y2": 530.265, "r_x3": 375.299, "r_y3": 530.265, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 377.067, "t": 534.81, "r": 406.883, "b": 539.0029999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.067, "r_y0": 539.0029999999999, "r_x1": 406.883, "r_y1": 539.0029999999999, "r_x2": 406.883, "r_y2": 534.81, "r_x3": 377.067, "r_y3": 534.81, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 383.567, "t": 563.296, "r": 433.765, "b": 567.489, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.567, "r_y0": 567.489, "r_x1": 433.765, "r_y1": 567.489, "r_x2": 433.765, "r_y2": 563.296, "r_x3": 383.567, "r_y3": 563.296, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 383.528, "t": 567.841, "r": 433.808, "b": 572.034, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.528, "r_y0": 572.034, "r_x1": 433.808, "r_y1": 572.034, "r_x2": 433.808, "r_y2": 567.841, "r_x3": 383.528, "r_y3": 567.841, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 390.475, "t": 572.386, "r": 426.857, "b": 576.579, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.475, "r_y0": 576.579, "r_x1": 426.857, "r_y1": 576.579, "r_x2": 426.857, "r_y2": 572.386, "r_x3": 390.475, "r_y3": 572.386, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 293.947, "t": 577.946, "r": 323.169, "b": 582.139, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 582.139, "r_x1": 323.169, "r_y1": 582.139, "r_x2": 323.169, "r_y2": 577.946, "r_x3": 293.947, "r_y3": 577.946, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 293.947, "t": 582.491, "r": 324.594, "b": 586.684, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 586.684, "r_x1": 324.594, "r_y1": 586.684, "r_x2": 324.594, "r_y2": 582.491, "r_x3": 293.947, "r_y3": 582.491, "coord_origin": "TOPLEFT"}, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 333.078, "t": 541.877, "r": 364.147, "b": 546.0699999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 546.0699999999999, "r_x1": 364.147, "r_y1": 546.0699999999999, "r_x2": 364.147, "r_y2": 541.877, "r_x3": 333.078, "r_y3": 541.877, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 333.078, "t": 545.665, "r": 369.715, "b": 549.858, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 549.858, "r_x1": 369.715, "r_y1": 549.858, "r_x2": 369.715, "r_y2": 545.665, "r_x3": 333.078, "r_y3": 545.665, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 232.659, "t": 515.296, "r": 249.589, "b": 519.489, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.659, "r_y0": 519.489, "r_x1": 249.589, "r_y1": 519.489, "r_x2": 249.589, "r_y2": 515.296, "r_x3": 232.659, "r_y3": 515.296, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 269.822, "t": 546.0260000000001, "r": 288.263, "b": 550.218, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.822, "r_y0": 550.218, "r_x1": 288.263, "r_y1": 550.218, "r_x2": 288.263, "r_y2": 546.0260000000001, "r_x3": 269.822, "r_y3": 546.0260000000001, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 270.452, "t": 549.813, "r": 287.632, "b": 554.006, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 554.006, "r_x1": 287.632, "r_y1": 554.006, "r_x2": 287.632, "r_y2": 549.813, "r_x3": 270.452, "r_y3": 549.813, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 332.177, "t": 515.967, "r": 358.112, "b": 520.1600000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 520.1600000000001, "r_x1": 358.112, "r_y1": 520.1600000000001, "r_x2": 358.112, "r_y2": 515.967, "r_x3": 332.177, "r_y3": 515.967, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 332.177, "t": 522.027, "r": 361.583, "b": 526.22, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 526.22, "r_x1": 361.583, "r_y1": 526.22, "r_x2": 361.583, "r_y2": 522.027, "r_x3": 332.177, "r_y3": 522.027, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 332.177, "t": 528.087, "r": 364.765, "b": 532.28, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 532.28, "r_x1": 364.765, "r_y1": 532.28, "r_x2": 364.765, "r_y2": 528.087, "r_x3": 332.177, "r_y3": 528.087, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 332.177, "t": 534.1469999999999, "r": 335.965, "b": 538.34, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 538.34, "r_x1": 335.965, "r_y1": 538.34, "r_x2": 335.965, "r_y2": 534.1469999999999, "r_x3": 332.177, "r_y3": 534.1469999999999, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 326.889, "t": 516.45, "r": 329.416, "b": 520.643, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.889, "r_y0": 520.643, "r_x1": 329.416, "r_y1": 520.643, "r_x2": 329.416, "r_y2": 516.45, "r_x3": 326.889, "r_y3": 516.45, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 327.041, "t": 522.479, "r": 329.568, "b": 526.672, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 526.672, "r_x1": 329.568, "r_y1": 526.672, "r_x2": 329.568, "r_y2": 522.479, "r_x3": 327.041, "r_y3": 522.479, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 327.041, "t": 528.5699999999999, "r": 329.568, "b": 532.7629999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 532.7629999999999, "r_x1": 329.568, "r_y1": 532.7629999999999, "r_x2": 329.568, "r_y2": 528.5699999999999, "r_x3": 327.041, "r_y3": 528.5699999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 424.141, "t": 527.4970000000001, "r": 426.668, "b": 531.69, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.141, "r_y0": 531.69, "r_x1": 426.668, "r_y1": 531.69, "r_x2": 426.668, "r_y2": 527.4970000000001, "r_x3": 424.141, "r_y3": 527.4970000000001, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 453.002, "t": 517.508, "r": 455.529, "b": 521.701, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.002, "r_y0": 521.701, "r_x1": 455.529, "r_y1": 521.701, "r_x2": 455.529, "r_y2": 517.508, "r_x3": 453.002, "r_y3": 517.508, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 423.858, "t": 517.117, "r": 426.385, "b": 521.31, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.858, "r_y0": 521.31, "r_x1": 426.385, "r_y1": 521.31, "r_x2": 426.385, "r_y2": 517.117, "r_x3": 423.858, "r_y3": 517.117, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 333.434, "t": 556.947, "r": 359.834, "b": 562.3389999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.434, "r_y0": 562.3389999999999, "r_x1": 359.834, "r_y1": 561.855, "r_x2": 359.834, "r_y2": 556.947, "r_x3": 333.434, "r_y3": 557.431, "coord_origin": "TOPLEFT"}, "text": "C C L NL", "orig": "C C L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 340.31, "t": 563.644, "r": 359.986, "b": 568.837, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.31, "r_y0": 568.837, "r_x1": 359.986, "r_y1": 568.552, "r_x2": 359.986, "r_y2": 563.644, "r_x3": 340.31, "r_y3": 563.929, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 333.596, "t": 563.887, "r": 337.437, "b": 568.795, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.596, "r_y0": 568.795, "r_x1": 337.437, "r_y1": 568.795, "r_x2": 337.437, "r_y2": 563.887, "r_x3": 333.596, "r_y3": 563.887, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 340.375, "t": 570.226, "r": 359.999, "b": 575.399, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.375, "r_y0": 575.399, "r_x1": 359.999, "r_y1": 575.134, "r_x2": 359.999, "r_y2": 570.226, "r_x3": 340.375, "r_y3": 570.491, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 333.661, "t": 570.448, "r": 337.503, "b": 575.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.661, "r_y0": 575.356, "r_x1": 337.503, "r_y1": 575.356, "r_x2": 337.503, "r_y2": 570.448, "r_x3": 333.661, "r_y3": 570.448, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 340.377, "t": 576.83, "r": 359.954, "b": 581.998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.377, "r_y0": 581.998, "r_x1": 359.954, "r_y1": 581.738, "r_x2": 359.954, "r_y2": 576.83, "r_x3": 340.377, "r_y3": 577.09, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 333.663, "t": 577.047, "r": 337.504, "b": 581.955, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.663, "r_y0": 581.955, "r_x1": 337.504, "r_y1": 581.955, "r_x2": 337.504, "r_y2": 577.047, "r_x3": 333.663, "r_y3": 577.047, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 340.279, "t": 583.461, "r": 360.07, "b": 588.3779999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.279, "r_y0": 588.369, "r_x1": 360.07, "r_y1": 588.3779999999999, "r_x2": 360.07, "r_y2": 583.47, "r_x3": 340.279, "r_y3": 583.461, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 333.566, "t": 583.419, "r": 337.407, "b": 588.327, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.566, "r_y0": 588.327, "r_x1": 337.407, "r_y1": 588.327, "r_x2": 337.407, "r_y2": 583.419, "r_x3": 333.566, "r_y3": 583.419, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 331.14, "t": 564.345, "r": 333.667, "b": 568.538, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.14, "r_y0": 568.538, "r_x1": 333.667, "r_y1": 568.538, "r_x2": 333.667, "r_y2": 564.345, "r_x3": 331.14, "r_y3": 564.345, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 340.81, "t": 554.648, "r": 343.337, "b": 558.841, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.81, "r_y0": 558.841, "r_x1": 343.337, "r_y1": 558.841, "r_x2": 343.337, "r_y2": 554.648, "r_x3": 340.81, "r_y3": 554.648, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 330.98, "t": 554.885, "r": 333.507, "b": 559.078, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.98, "r_y0": 559.078, "r_x1": 333.507, "r_y1": 559.078, "r_x2": 333.507, "r_y2": 554.885, "r_x3": 330.98, "r_y3": 554.885, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "text", "id": 4, "page_no": 7, "cluster": {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 620.193, "r": 480.592, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.951270341873169, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 628.99, "r_x1": 480.588, "r_y1": 628.99, "r_x2": 480.588, "r_y2": 620.193, "r_x3": 149.709, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 155.846, "r_y1": 664.855, "r_x2": 155.846, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.442, "r_y0": 664.855, "r_x1": 480.59, "r_y1": 664.855, "r_x2": 480.59, "r_y2": 656.058, "r_x3": 159.442, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "The predicted OTSL structures were converted back to HTML format in", "orig": "The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for table structure prediction, and Mean Average Precision (mAP) with 0.75 Intersection Over Union (IOU) threshold for the bounding-box predictions of table cells. The predicted OTSL structures were converted back to HTML format in"}], "body": [{"label": "text", "id": 5, "page_no": 7, "cluster": {"id": 5, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.589, "b": 139.68600000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9464744925498962, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.589, "r_y1": 127.731, "r_x2": 480.589, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 163.564, "r_y1": 139.68600000000004, "r_x2": 163.564, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "reduces significantly the column drift seen in the HTML based models (see Figure 5)."}, {"label": "section_header", "id": 2, "page_no": 7, "cluster": {"id": 2, "label": "section_header", "bbox": {"l": 134.765, "t": 161.55700000000002, "r": 319.347, "b": 170.36400000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9549514651298523, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 170.36400000000003, "r_x1": 149.402, "r_y1": 170.36400000000003, "r_x2": 149.402, "r_y2": 161.55700000000002, "r_x3": 134.765, "r_y3": 161.55700000000002, "coord_origin": "TOPLEFT"}, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 170.36400000000003, "r_x1": 319.347, "r_y1": 170.36400000000003, "r_x2": 319.347, "r_y2": 161.55700000000002, "r_x3": 160.859, "r_y3": 161.55700000000002, "coord_origin": "TOPLEFT"}, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.3 Error-detection and -mitigation"}, {"label": "text", "id": 0, "page_no": 7, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 182.28200000000004, "r": 480.596, "b": 298.676, "coord_origin": "TOPLEFT"}, "confidence": 0.9879790544509888, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 191.07899999999995, "r_x1": 480.596, "r_y1": 191.07899999999995, "r_x2": 480.596, "r_y2": 182.28200000000004, "r_x3": 134.765, "r_y3": 182.28200000000004, "coord_origin": "TOPLEFT"}, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 203.03499999999997, "r_x1": 480.595, "r_y1": 203.03499999999997, "r_x2": 480.595, "r_y2": 194.23800000000006, "r_x3": 134.765, "r_y3": 194.23800000000006, "coord_origin": "TOPLEFT"}, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 214.99, "r_x1": 480.587, "r_y1": 214.99, "r_x2": 480.587, "r_y2": 206.19299999999998, "r_x3": 134.765, "r_y3": 206.19299999999998, "coord_origin": "TOPLEFT"}, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 226.94500000000005, "r_x1": 480.592, "r_y1": 226.94500000000005, "r_x2": 480.592, "r_y2": 218.14800000000002, "r_x3": 134.765, "r_y3": 218.14800000000002, "coord_origin": "TOPLEFT"}, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 238.89999999999998, "r_x1": 480.588, "r_y1": 238.89999999999998, "r_x2": 480.588, "r_y2": 230.10299999999995, "r_x3": 134.765, "r_y3": 230.10299999999995, "coord_origin": "TOPLEFT"}, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 250.85500000000002, "r_x1": 480.587, "r_y1": 250.85500000000002, "r_x2": 480.587, "r_y2": 242.058, "r_x3": 134.765, "r_y3": 242.058, "coord_origin": "TOPLEFT"}, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 262.80999999999995, "r_x1": 480.594, "r_y1": 262.80999999999995, "r_x2": 480.594, "r_y2": 254.01300000000003, "r_x3": 134.765, "r_y3": 254.01300000000003, "coord_origin": "TOPLEFT"}, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 274.76599999999996, "r_x1": 480.591, "r_y1": 274.76599999999996, "r_x2": 480.591, "r_y2": 265.96900000000005, "r_x3": 134.765, "r_y3": 265.96900000000005, "coord_origin": "TOPLEFT"}, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 286.721, "r_x1": 480.596, "r_y1": 286.721, "r_x2": 480.596, "r_y2": 277.924, "r_x3": 134.765, "r_y3": 277.924, "coord_origin": "TOPLEFT"}, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 298.676, "r_x1": 469.404, "r_y1": 298.676, "r_x2": 469.404, "r_y2": 289.879, "r_x3": 134.765, "r_y3": 289.879, "coord_origin": "TOPLEFT"}, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The design of OTSL allows to validate a table structure easily on an unfinished sequence. The detection of an invalid sequence token is a clear indication of a prediction mistake, however a valid sequence by itself does not guarantee prediction correctness. Different heuristics can be used to correct token errors in an invalid sequence and thus increase the chances for accurate predictions. Such heuristics can be applied either after the prediction of each token, or at the end on the entire predicted sequence. For example a simple heuristic which can correct the predicted OTSL sequence on-the-fly is to verify if the token with the highest prediction confidence invalidates the predicted sequence, and replace it by the token with the next highest confidence until OTSL rules are satisfied."}, {"label": "section_header", "id": 3, "page_no": 7, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 321.164, "r": 229.035, "b": 331.732, "coord_origin": "TOPLEFT"}, "confidence": 0.95152747631073, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 331.732, "r_x1": 141.489, "r_y1": 331.732, "r_x2": 141.489, "r_y2": 321.164, "r_x3": 134.765, "r_y3": 321.164, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 331.732, "r_x1": 229.035, "r_y1": 331.732, "r_x2": 229.035, "r_y2": 321.164, "r_x3": 154.938, "r_y3": 321.164, "coord_origin": "TOPLEFT"}, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5 Experiments"}, {"label": "text", "id": 1, "page_no": 7, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 347.25, "r": 480.595, "b": 451.688, "coord_origin": "TOPLEFT"}, "confidence": 0.9877985119819641, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 356.047, "r_x1": 480.594, "r_y1": 356.047, "r_x2": 480.594, "r_y2": 347.25, "r_x3": 134.765, "r_y3": 347.25, "coord_origin": "TOPLEFT"}, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 368.002, "r_x1": 480.595, "r_y1": 368.002, "r_x2": 480.595, "r_y2": 359.205, "r_x3": 134.765, "r_y3": 359.205, "coord_origin": "TOPLEFT"}, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 379.957, "r_x1": 480.588, "r_y1": 379.957, "r_x2": 480.588, "r_y2": 371.16, "r_x3": 134.765, "r_y3": 371.16, "coord_origin": "TOPLEFT"}, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 391.912, "r_x1": 480.588, "r_y1": 391.912, "r_x2": 480.588, "r_y2": 383.115, "r_x3": 134.765, "r_y3": 383.115, "coord_origin": "TOPLEFT"}, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 403.867, "r_x1": 148.598, "r_y1": 403.867, "r_x2": 148.598, "r_y2": 395.07, "r_x3": 134.765, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.627, "r_y0": 403.867, "r_x1": 191.847, "r_y1": 403.867, "r_x2": 191.847, "r_y2": 395.07, "r_x3": 151.627, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.902, "r_y0": 403.867, "r_x1": 480.595, "r_y1": 403.867, "r_x2": 480.595, "r_y2": 395.07, "r_x3": 195.902, "r_y3": 395.07, "coord_origin": "TOPLEFT"}, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 415.822, "r_x1": 172.59, "r_y1": 415.822, "r_x2": 172.59, "r_y2": 407.025, "r_x3": 134.765, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "found in", "orig": "found in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.492, "r_y0": 415.822, "r_x1": 191.325, "r_y1": 415.822, "r_x2": 191.325, "r_y2": 407.025, "r_x3": 177.492, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.226, "r_y0": 415.822, "r_x1": 213.463, "r_y1": 415.822, "r_x2": 213.463, "r_y2": 407.025, "r_x3": 196.226, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "first", "orig": "first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.364, "r_y0": 415.822, "r_x1": 236.125, "r_y1": 415.822, "r_x2": 236.125, "r_y2": 407.025, "r_x3": 218.364, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "step", "orig": "step", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.027, "r_y0": 415.822, "r_x1": 297.661, "r_y1": 415.822, "r_x2": 297.661, "r_y2": 407.025, "r_x3": 241.027, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "and evaluate", "orig": "and evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.563, "r_y0": 415.822, "r_x1": 480.593, "r_y1": 415.822, "r_x2": 480.593, "r_y2": 407.025, "r_x3": 302.563, "r_y3": 407.025, "coord_origin": "TOPLEFT"}, "text": "how OTSL impacts the performance of", "orig": "how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 427.778, "r_x1": 377.321, "r_y1": 427.778, "r_x2": 377.321, "r_y2": 418.981, "r_x3": 134.765, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "TableFormer after training on other publicly available", "orig": "TableFormer after training on other publicly available", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.874, "r_y0": 427.778, "r_x1": 421.951, "r_y1": 427.778, "r_x2": 421.951, "r_y2": 418.981, "r_x3": 381.874, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "data sets", "orig": "data sets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.504, "r_y0": 427.778, "r_x1": 480.595, "r_y1": 427.778, "r_x2": 480.595, "r_y2": 418.981, "r_x3": 426.504, "r_y3": 418.981, "coord_origin": "TOPLEFT"}, "text": "(FinTabNet,", "orig": "(FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.733, "r_x1": 480.592, "r_y1": 439.733, "r_x2": 480.592, "r_y2": 430.936, "r_x3": 134.765, "r_y3": 430.936, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 451.688, "r_x1": 479.303, "r_y1": 451.688, "r_x2": 479.303, "r_y2": 442.891, "r_x3": 134.765, "r_y3": 442.891, "coord_origin": "TOPLEFT"}, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we conducted a series of experiments based on the TableFormer model (Figure 4) with two objectives: Firstly we evaluate the prediction quality and performance of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on the canonical PubTabNet data set. Secondly we pick the best hyper-parameters found in the first step and evaluate how OTSL impacts the performance of TableFormer after training on other publicly available data sets (FinTabNet, PubTables-1M [14]). The ground truth (GT) from all data sets has been converted into OTSL format for this purpose, and will be made publicly available."}, {"label": "caption", "id": 7, "page_no": 7, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 134.765, "t": 482.433, "r": 480.591, "b": 504.681, "coord_origin": "TOPLEFT"}, "confidence": 0.9297956228256226, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 492.574, "r_x1": 162.644, "r_y1": 492.574, "r_x2": 162.644, "r_y2": 484.648, "r_x3": 134.765, "r_y3": 484.648, "coord_origin": "TOPLEFT"}, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.196, "r_y0": 493.722, "r_x1": 480.591, "r_y1": 493.722, "r_x2": 480.591, "r_y2": 482.433, "r_x3": 165.196, "r_y3": 482.433, "coord_origin": "TOPLEFT"}, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 504.681, "r_x1": 206.702, "r_y1": 504.681, "r_x2": 206.702, "r_y2": 493.392, "r_x3": 134.765, "r_y3": 493.392, "coord_origin": "TOPLEFT"}, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 4. Architecture sketch of the TableFormer model, which is a representative for the Im2Seq approach."}, {"label": "picture", "id": 6, "page_no": 7, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 140.70968627929688, "t": 508.0638427734375, "r": 472.73382568359375, "b": 593.6771850585938, "coord_origin": "TOPLEFT"}, "confidence": 0.9303396344184875, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 543.091, "r_x1": 149.407, "r_y1": 543.091, "r_x2": 149.407, "r_y2": 540.762, "r_x3": 147.3, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 543.091, "r_x1": 155.721, "r_y1": 543.091, "r_x2": 155.721, "r_y2": 540.762, "r_x3": 150.809, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 162.76, "r_y0": 537.754, "r_x1": 172.296, "r_y1": 537.754, "r_x2": 172.296, "r_y2": 535.424, "r_x3": 162.76, "r_y3": 535.424, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.636, "r_y0": 537.726, "r_x1": 155.918, "r_y1": 537.726, "r_x2": 155.918, "r_y2": 535.396, "r_x3": 147.636, "r_y3": 535.396, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 543.091, "r_x1": 164.102, "r_y1": 543.091, "r_x2": 164.102, "r_y2": 540.762, "r_x3": 158.485, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 547.03, "r_x1": 162.697, "r_y1": 547.03, "r_x2": 162.697, "r_y2": 544.701, "r_x3": 158.485, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 551.2719999999999, "r_x1": 164.102, "r_y1": 551.2719999999999, "r_x2": 164.102, "r_y2": 548.943, "r_x3": 158.485, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 555.514, "r_x1": 162.697, "r_y1": 555.514, "r_x2": 162.697, "r_y2": 553.185, "r_x3": 158.485, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 543.091, "r_x1": 172.889, "r_y1": 543.091, "r_x2": 172.889, "r_y2": 540.762, "r_x3": 168.817, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 547.03, "r_x1": 172.889, "r_y1": 547.03, "r_x2": 172.889, "r_y2": 544.701, "r_x3": 168.817, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 551.2719999999999, "r_x1": 172.889, "r_y1": 551.2719999999999, "r_x2": 172.889, "r_y2": 548.943, "r_x3": 168.817, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 555.514, "r_x1": 172.889, "r_y1": 555.514, "r_x2": 172.889, "r_y2": 553.185, "r_x3": 168.817, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 547.03, "r_x1": 149.407, "r_y1": 547.03, "r_x2": 149.407, "r_y2": 544.701, "r_x3": 147.3, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 547.03, "r_x1": 155.721, "r_y1": 547.03, "r_x2": 155.721, "r_y2": 544.701, "r_x3": 150.809, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 551.2719999999999, "r_x1": 149.407, "r_y1": 551.2719999999999, "r_x2": 149.407, "r_y2": 548.943, "r_x3": 147.3, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 551.2719999999999, "r_x1": 155.721, "r_y1": 551.2719999999999, "r_x2": 155.721, "r_y2": 548.943, "r_x3": 150.809, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 555.514, "r_x1": 149.407, "r_y1": 555.514, "r_x2": 149.407, "r_y2": 553.185, "r_x3": 147.3, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 555.514, "r_x1": 155.721, "r_y1": 555.514, "r_x2": 155.721, "r_y2": 553.185, "r_x3": 150.809, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.05, "r_y0": 521.2570000000001, "r_x1": 171.249, "r_y1": 521.2570000000001, "r_x2": 171.249, "r_y2": 517.0640000000001, "r_x3": 152.05, "r_y3": 517.0640000000001, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.133, "r_y0": 526.56, "r_x1": 175.168, "r_y1": 526.56, "r_x2": 175.168, "r_y2": 522.367, "r_x3": 148.133, "r_y3": 522.367, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.533, "r_y0": 528.762, "r_x1": 220.32, "r_y1": 528.762, "r_x2": 220.32, "r_y2": 524.569, "r_x3": 193.533, "r_y3": 524.569, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.473, "r_y0": 534.0640000000001, "r_x1": 214.379, "r_y1": 534.0640000000001, "r_x2": 214.379, "r_y2": 529.871, "r_x3": 199.473, "r_y3": 529.871, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.611, "r_y0": 514.153, "r_x1": 284.473, "r_y1": 514.153, "r_x2": 284.473, "r_y2": 509.96, "r_x3": 273.611, "r_y3": 509.96, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 517.94, "r_x1": 287.632, "r_y1": 517.94, "r_x2": 287.632, "r_y2": 513.7470000000001, "r_x3": 270.452, "r_y3": 513.7470000000001, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.478, "r_y0": 512.392, "r_x1": 348.14, "r_y1": 512.392, "r_x2": 348.14, "r_y2": 508.199, "r_x3": 332.478, "r_y3": 508.199, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.686, "r_y0": 525.3679999999999, "r_x1": 407.255, "r_y1": 525.3679999999999, "r_x2": 407.255, "r_y2": 521.175, "r_x3": 376.686, "r_y3": 521.175, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.909, "r_y0": 529.913, "r_x1": 410.035, "r_y1": 529.913, "r_x2": 410.035, "r_y2": 525.72, "r_x3": 373.909, "r_y3": 525.72, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.299, "r_y0": 534.4580000000001, "r_x1": 408.649, "r_y1": 534.4580000000001, "r_x2": 408.649, "r_y2": 530.265, "r_x3": 375.299, "r_y3": 530.265, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.067, "r_y0": 539.0029999999999, "r_x1": 406.883, "r_y1": 539.0029999999999, "r_x2": 406.883, "r_y2": 534.81, "r_x3": 377.067, "r_y3": 534.81, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.567, "r_y0": 567.489, "r_x1": 433.765, "r_y1": 567.489, "r_x2": 433.765, "r_y2": 563.296, "r_x3": 383.567, "r_y3": 563.296, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.528, "r_y0": 572.034, "r_x1": 433.808, "r_y1": 572.034, "r_x2": 433.808, "r_y2": 567.841, "r_x3": 383.528, "r_y3": 567.841, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.475, "r_y0": 576.579, "r_x1": 426.857, "r_y1": 576.579, "r_x2": 426.857, "r_y2": 572.386, "r_x3": 390.475, "r_y3": 572.386, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 582.139, "r_x1": 323.169, "r_y1": 582.139, "r_x2": 323.169, "r_y2": 577.946, "r_x3": 293.947, "r_y3": 577.946, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 586.684, "r_x1": 324.594, "r_y1": 586.684, "r_x2": 324.594, "r_y2": 582.491, "r_x3": 293.947, "r_y3": 582.491, "coord_origin": "TOPLEFT"}, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 546.0699999999999, "r_x1": 364.147, "r_y1": 546.0699999999999, "r_x2": 364.147, "r_y2": 541.877, "r_x3": 333.078, "r_y3": 541.877, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 549.858, "r_x1": 369.715, "r_y1": 549.858, "r_x2": 369.715, "r_y2": 545.665, "r_x3": 333.078, "r_y3": 545.665, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.659, "r_y0": 519.489, "r_x1": 249.589, "r_y1": 519.489, "r_x2": 249.589, "r_y2": 515.296, "r_x3": 232.659, "r_y3": 515.296, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.822, "r_y0": 550.218, "r_x1": 288.263, "r_y1": 550.218, "r_x2": 288.263, "r_y2": 546.0260000000001, "r_x3": 269.822, "r_y3": 546.0260000000001, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 554.006, "r_x1": 287.632, "r_y1": 554.006, "r_x2": 287.632, "r_y2": 549.813, "r_x3": 270.452, "r_y3": 549.813, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 520.1600000000001, "r_x1": 358.112, "r_y1": 520.1600000000001, "r_x2": 358.112, "r_y2": 515.967, "r_x3": 332.177, "r_y3": 515.967, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 526.22, "r_x1": 361.583, "r_y1": 526.22, "r_x2": 361.583, "r_y2": 522.027, "r_x3": 332.177, "r_y3": 522.027, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 532.28, "r_x1": 364.765, "r_y1": 532.28, "r_x2": 364.765, "r_y2": 528.087, "r_x3": 332.177, "r_y3": 528.087, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 538.34, "r_x1": 335.965, "r_y1": 538.34, "r_x2": 335.965, "r_y2": 534.1469999999999, "r_x3": 332.177, "r_y3": 534.1469999999999, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.889, "r_y0": 520.643, "r_x1": 329.416, "r_y1": 520.643, "r_x2": 329.416, "r_y2": 516.45, "r_x3": 326.889, "r_y3": 516.45, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 526.672, "r_x1": 329.568, "r_y1": 526.672, "r_x2": 329.568, "r_y2": 522.479, "r_x3": 327.041, "r_y3": 522.479, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 532.7629999999999, "r_x1": 329.568, "r_y1": 532.7629999999999, "r_x2": 329.568, "r_y2": 528.5699999999999, "r_x3": 327.041, "r_y3": 528.5699999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.141, "r_y0": 531.69, "r_x1": 426.668, "r_y1": 531.69, "r_x2": 426.668, "r_y2": 527.4970000000001, "r_x3": 424.141, "r_y3": 527.4970000000001, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.002, "r_y0": 521.701, "r_x1": 455.529, "r_y1": 521.701, "r_x2": 455.529, "r_y2": 517.508, "r_x3": 453.002, "r_y3": 517.508, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.858, "r_y0": 521.31, "r_x1": 426.385, "r_y1": 521.31, "r_x2": 426.385, "r_y2": 517.117, "r_x3": 423.858, "r_y3": 517.117, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.434, "r_y0": 562.3389999999999, "r_x1": 359.834, "r_y1": 561.855, "r_x2": 359.834, "r_y2": 556.947, "r_x3": 333.434, "r_y3": 557.431, "coord_origin": "TOPLEFT"}, "text": "C C L NL", "orig": "C C L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.31, "r_y0": 568.837, "r_x1": 359.986, "r_y1": 568.552, "r_x2": 359.986, "r_y2": 563.644, "r_x3": 340.31, "r_y3": 563.929, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.596, "r_y0": 568.795, "r_x1": 337.437, "r_y1": 568.795, "r_x2": 337.437, "r_y2": 563.887, "r_x3": 333.596, "r_y3": 563.887, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.375, "r_y0": 575.399, "r_x1": 359.999, "r_y1": 575.134, "r_x2": 359.999, "r_y2": 570.226, "r_x3": 340.375, "r_y3": 570.491, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.661, "r_y0": 575.356, "r_x1": 337.503, "r_y1": 575.356, "r_x2": 337.503, "r_y2": 570.448, "r_x3": 333.661, "r_y3": 570.448, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.377, "r_y0": 581.998, "r_x1": 359.954, "r_y1": 581.738, "r_x2": 359.954, "r_y2": 576.83, "r_x3": 340.377, "r_y3": 577.09, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.663, "r_y0": 581.955, "r_x1": 337.504, "r_y1": 581.955, "r_x2": 337.504, "r_y2": 577.047, "r_x3": 333.663, "r_y3": 577.047, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.279, "r_y0": 588.369, "r_x1": 360.07, "r_y1": 588.3779999999999, "r_x2": 360.07, "r_y2": 583.47, "r_x3": 340.279, "r_y3": 583.461, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.566, "r_y0": 588.327, "r_x1": 337.407, "r_y1": 588.327, "r_x2": 337.407, "r_y2": 583.419, "r_x3": 333.566, "r_y3": 583.419, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.14, "r_y0": 568.538, "r_x1": 333.667, "r_y1": 568.538, "r_x2": 333.667, "r_y2": 564.345, "r_x3": 331.14, "r_y3": 564.345, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.81, "r_y0": 558.841, "r_x1": 343.337, "r_y1": 558.841, "r_x2": 343.337, "r_y2": 554.648, "r_x3": 340.81, "r_y3": 554.648, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.98, "r_y0": 559.078, "r_x1": 333.507, "r_y1": 559.078, "r_x2": 333.507, "r_y2": 554.885, "r_x3": 330.98, "r_y3": 554.885, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 13, "label": "text", "bbox": {"l": 147.3, "t": 540.762, "r": 149.407, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 543.091, "r_x1": 149.407, "r_y1": 543.091, "r_x2": 149.407, "r_y2": 540.762, "r_x3": 147.3, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 150.809, "t": 540.762, "r": 155.721, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 543.091, "r_x1": 155.721, "r_y1": 543.091, "r_x2": 155.721, "r_y2": 540.762, "r_x3": 150.809, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 162.76, "t": 535.424, "r": 172.296, "b": 537.754, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 162.76, "r_y0": 537.754, "r_x1": 172.296, "r_y1": 537.754, "r_x2": 172.296, "r_y2": 535.424, "r_x3": 162.76, "r_y3": 535.424, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 147.636, "t": 535.396, "r": 155.918, "b": 537.726, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.636, "r_y0": 537.726, "r_x1": 155.918, "r_y1": 537.726, "r_x2": 155.918, "r_y2": 535.396, "r_x3": 147.636, "r_y3": 535.396, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 158.485, "t": 540.762, "r": 164.102, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 543.091, "r_x1": 164.102, "r_y1": 543.091, "r_x2": 164.102, "r_y2": 540.762, "r_x3": 158.485, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 158.485, "t": 544.701, "r": 162.697, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 547.03, "r_x1": 162.697, "r_y1": 547.03, "r_x2": 162.697, "r_y2": 544.701, "r_x3": 158.485, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 158.485, "t": 548.943, "r": 164.102, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 551.2719999999999, "r_x1": 164.102, "r_y1": 551.2719999999999, "r_x2": 164.102, "r_y2": 548.943, "r_x3": 158.485, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 158.485, "t": 553.185, "r": 162.697, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 158.485, "r_y0": 555.514, "r_x1": 162.697, "r_y1": 555.514, "r_x2": 162.697, "r_y2": 553.185, "r_x3": 158.485, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 168.817, "t": 540.762, "r": 172.889, "b": 543.091, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 543.091, "r_x1": 172.889, "r_y1": 543.091, "r_x2": 172.889, "r_y2": 540.762, "r_x3": 168.817, "r_y3": 540.762, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 168.817, "t": 544.701, "r": 172.889, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 547.03, "r_x1": 172.889, "r_y1": 547.03, "r_x2": 172.889, "r_y2": 544.701, "r_x3": 168.817, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 168.817, "t": 548.943, "r": 172.889, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 551.2719999999999, "r_x1": 172.889, "r_y1": 551.2719999999999, "r_x2": 172.889, "r_y2": 548.943, "r_x3": 168.817, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 168.817, "t": 553.185, "r": 172.889, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.817, "r_y0": 555.514, "r_x1": 172.889, "r_y1": 555.514, "r_x2": 172.889, "r_y2": 553.185, "r_x3": 168.817, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 147.3, "t": 544.701, "r": 149.407, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 547.03, "r_x1": 149.407, "r_y1": 547.03, "r_x2": 149.407, "r_y2": 544.701, "r_x3": 147.3, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 150.809, "t": 544.701, "r": 155.721, "b": 547.03, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 547.03, "r_x1": 155.721, "r_y1": 547.03, "r_x2": 155.721, "r_y2": 544.701, "r_x3": 150.809, "r_y3": 544.701, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 147.3, "t": 548.943, "r": 149.407, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 551.2719999999999, "r_x1": 149.407, "r_y1": 551.2719999999999, "r_x2": 149.407, "r_y2": 548.943, "r_x3": 147.3, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 150.809, "t": 548.943, "r": 155.721, "b": 551.2719999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 551.2719999999999, "r_x1": 155.721, "r_y1": 551.2719999999999, "r_x2": 155.721, "r_y2": 548.943, "r_x3": 150.809, "r_y3": 548.943, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 147.3, "t": 553.185, "r": 149.407, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.3, "r_y0": 555.514, "r_x1": 149.407, "r_y1": 555.514, "r_x2": 149.407, "r_y2": 553.185, "r_x3": 147.3, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 150.809, "t": 553.185, "r": 155.721, "b": 555.514, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.809, "r_y0": 555.514, "r_x1": 155.721, "r_y1": 555.514, "r_x2": 155.721, "r_y2": 553.185, "r_x3": 150.809, "r_y3": 553.185, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 152.05, "t": 517.0640000000001, "r": 171.249, "b": 521.2570000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.05, "r_y0": 521.2570000000001, "r_x1": 171.249, "r_y1": 521.2570000000001, "r_x2": 171.249, "r_y2": 517.0640000000001, "r_x3": 152.05, "r_y3": 517.0640000000001, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 148.133, "t": 522.367, "r": 175.168, "b": 526.56, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.133, "r_y0": 526.56, "r_x1": 175.168, "r_y1": 526.56, "r_x2": 175.168, "r_y2": 522.367, "r_x3": 148.133, "r_y3": 522.367, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 193.533, "t": 524.569, "r": 220.32, "b": 528.762, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.533, "r_y0": 528.762, "r_x1": 220.32, "r_y1": 528.762, "r_x2": 220.32, "r_y2": 524.569, "r_x3": 193.533, "r_y3": 524.569, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 199.473, "t": 529.871, "r": 214.379, "b": 534.0640000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.473, "r_y0": 534.0640000000001, "r_x1": 214.379, "r_y1": 534.0640000000001, "r_x2": 214.379, "r_y2": 529.871, "r_x3": 199.473, "r_y3": 529.871, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 273.611, "t": 509.96, "r": 284.473, "b": 514.153, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.611, "r_y0": 514.153, "r_x1": 284.473, "r_y1": 514.153, "r_x2": 284.473, "r_y2": 509.96, "r_x3": 273.611, "r_y3": 509.96, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 270.452, "t": 513.7470000000001, "r": 287.632, "b": 517.94, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 517.94, "r_x1": 287.632, "r_y1": 517.94, "r_x2": 287.632, "r_y2": 513.7470000000001, "r_x3": 270.452, "r_y3": 513.7470000000001, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 332.478, "t": 508.199, "r": 348.14, "b": 512.392, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.478, "r_y0": 512.392, "r_x1": 348.14, "r_y1": 512.392, "r_x2": 348.14, "r_y2": 508.199, "r_x3": 332.478, "r_y3": 508.199, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 376.686, "t": 521.175, "r": 407.255, "b": 525.3679999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.686, "r_y0": 525.3679999999999, "r_x1": 407.255, "r_y1": 525.3679999999999, "r_x2": 407.255, "r_y2": 521.175, "r_x3": 376.686, "r_y3": 521.175, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 373.909, "t": 525.72, "r": 410.035, "b": 529.913, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 373.909, "r_y0": 529.913, "r_x1": 410.035, "r_y1": 529.913, "r_x2": 410.035, "r_y2": 525.72, "r_x3": 373.909, "r_y3": 525.72, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 375.299, "t": 530.265, "r": 408.649, "b": 534.4580000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.299, "r_y0": 534.4580000000001, "r_x1": 408.649, "r_y1": 534.4580000000001, "r_x2": 408.649, "r_y2": 530.265, "r_x3": 375.299, "r_y3": 530.265, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 377.067, "t": 534.81, "r": 406.883, "b": 539.0029999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.067, "r_y0": 539.0029999999999, "r_x1": 406.883, "r_y1": 539.0029999999999, "r_x2": 406.883, "r_y2": 534.81, "r_x3": 377.067, "r_y3": 534.81, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 383.567, "t": 563.296, "r": 433.765, "b": 567.489, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.567, "r_y0": 567.489, "r_x1": 433.765, "r_y1": 567.489, "r_x2": 433.765, "r_y2": 563.296, "r_x3": 383.567, "r_y3": 563.296, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 383.528, "t": 567.841, "r": 433.808, "b": 572.034, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.528, "r_y0": 572.034, "r_x1": 433.808, "r_y1": 572.034, "r_x2": 433.808, "r_y2": 567.841, "r_x3": 383.528, "r_y3": 567.841, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 390.475, "t": 572.386, "r": 426.857, "b": 576.579, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.475, "r_y0": 576.579, "r_x1": 426.857, "r_y1": 576.579, "r_x2": 426.857, "r_y2": 572.386, "r_x3": 390.475, "r_y3": 572.386, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 293.947, "t": 577.946, "r": 323.169, "b": 582.139, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 582.139, "r_x1": 323.169, "r_y1": 582.139, "r_x2": 323.169, "r_y2": 577.946, "r_x3": 293.947, "r_y3": 577.946, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 293.947, "t": 582.491, "r": 324.594, "b": 586.684, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.947, "r_y0": 586.684, "r_x1": 324.594, "r_y1": 586.684, "r_x2": 324.594, "r_y2": 582.491, "r_x3": 293.947, "r_y3": 582.491, "coord_origin": "TOPLEFT"}, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 333.078, "t": 541.877, "r": 364.147, "b": 546.0699999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 546.0699999999999, "r_x1": 364.147, "r_y1": 546.0699999999999, "r_x2": 364.147, "r_y2": 541.877, "r_x3": 333.078, "r_y3": 541.877, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 333.078, "t": 545.665, "r": 369.715, "b": 549.858, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.078, "r_y0": 549.858, "r_x1": 369.715, "r_y1": 549.858, "r_x2": 369.715, "r_y2": 545.665, "r_x3": 333.078, "r_y3": 545.665, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 232.659, "t": 515.296, "r": 249.589, "b": 519.489, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.659, "r_y0": 519.489, "r_x1": 249.589, "r_y1": 519.489, "r_x2": 249.589, "r_y2": 515.296, "r_x3": 232.659, "r_y3": 515.296, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 269.822, "t": 546.0260000000001, "r": 288.263, "b": 550.218, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.822, "r_y0": 550.218, "r_x1": 288.263, "r_y1": 550.218, "r_x2": 288.263, "r_y2": 546.0260000000001, "r_x3": 269.822, "r_y3": 546.0260000000001, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 270.452, "t": 549.813, "r": 287.632, "b": 554.006, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.452, "r_y0": 554.006, "r_x1": 287.632, "r_y1": 554.006, "r_x2": 287.632, "r_y2": 549.813, "r_x3": 270.452, "r_y3": 549.813, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 332.177, "t": 515.967, "r": 358.112, "b": 520.1600000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 520.1600000000001, "r_x1": 358.112, "r_y1": 520.1600000000001, "r_x2": 358.112, "r_y2": 515.967, "r_x3": 332.177, "r_y3": 515.967, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 332.177, "t": 522.027, "r": 361.583, "b": 526.22, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 526.22, "r_x1": 361.583, "r_y1": 526.22, "r_x2": 361.583, "r_y2": 522.027, "r_x3": 332.177, "r_y3": 522.027, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 332.177, "t": 528.087, "r": 364.765, "b": 532.28, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 532.28, "r_x1": 364.765, "r_y1": 532.28, "r_x2": 364.765, "r_y2": 528.087, "r_x3": 332.177, "r_y3": 528.087, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 332.177, "t": 534.1469999999999, "r": 335.965, "b": 538.34, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.177, "r_y0": 538.34, "r_x1": 335.965, "r_y1": 538.34, "r_x2": 335.965, "r_y2": 534.1469999999999, "r_x3": 332.177, "r_y3": 534.1469999999999, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 326.889, "t": 516.45, "r": 329.416, "b": 520.643, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.889, "r_y0": 520.643, "r_x1": 329.416, "r_y1": 520.643, "r_x2": 329.416, "r_y2": 516.45, "r_x3": 326.889, "r_y3": 516.45, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 327.041, "t": 522.479, "r": 329.568, "b": 526.672, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 526.672, "r_x1": 329.568, "r_y1": 526.672, "r_x2": 329.568, "r_y2": 522.479, "r_x3": 327.041, "r_y3": 522.479, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 327.041, "t": 528.5699999999999, "r": 329.568, "b": 532.7629999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.041, "r_y0": 532.7629999999999, "r_x1": 329.568, "r_y1": 532.7629999999999, "r_x2": 329.568, "r_y2": 528.5699999999999, "r_x3": 327.041, "r_y3": 528.5699999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 424.141, "t": 527.4970000000001, "r": 426.668, "b": 531.69, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.141, "r_y0": 531.69, "r_x1": 426.668, "r_y1": 531.69, "r_x2": 426.668, "r_y2": 527.4970000000001, "r_x3": 424.141, "r_y3": 527.4970000000001, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 453.002, "t": 517.508, "r": 455.529, "b": 521.701, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.002, "r_y0": 521.701, "r_x1": 455.529, "r_y1": 521.701, "r_x2": 455.529, "r_y2": 517.508, "r_x3": 453.002, "r_y3": 517.508, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 423.858, "t": 517.117, "r": 426.385, "b": 521.31, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.858, "r_y0": 521.31, "r_x1": 426.385, "r_y1": 521.31, "r_x2": 426.385, "r_y2": 517.117, "r_x3": 423.858, "r_y3": 517.117, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 333.434, "t": 556.947, "r": 359.834, "b": 562.3389999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.434, "r_y0": 562.3389999999999, "r_x1": 359.834, "r_y1": 561.855, "r_x2": 359.834, "r_y2": 556.947, "r_x3": 333.434, "r_y3": 557.431, "coord_origin": "TOPLEFT"}, "text": "C C L NL", "orig": "C C L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 340.31, "t": 563.644, "r": 359.986, "b": 568.837, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.31, "r_y0": 568.837, "r_x1": 359.986, "r_y1": 568.552, "r_x2": 359.986, "r_y2": 563.644, "r_x3": 340.31, "r_y3": 563.929, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 333.596, "t": 563.887, "r": 337.437, "b": 568.795, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.596, "r_y0": 568.795, "r_x1": 337.437, "r_y1": 568.795, "r_x2": 337.437, "r_y2": 563.887, "r_x3": 333.596, "r_y3": 563.887, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 340.375, "t": 570.226, "r": 359.999, "b": 575.399, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.375, "r_y0": 575.399, "r_x1": 359.999, "r_y1": 575.134, "r_x2": 359.999, "r_y2": 570.226, "r_x3": 340.375, "r_y3": 570.491, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 333.661, "t": 570.448, "r": 337.503, "b": 575.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.661, "r_y0": 575.356, "r_x1": 337.503, "r_y1": 575.356, "r_x2": 337.503, "r_y2": 570.448, "r_x3": 333.661, "r_y3": 570.448, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 340.377, "t": 576.83, "r": 359.954, "b": 581.998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.377, "r_y0": 581.998, "r_x1": 359.954, "r_y1": 581.738, "r_x2": 359.954, "r_y2": 576.83, "r_x3": 340.377, "r_y3": 577.09, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 333.663, "t": 577.047, "r": 337.504, "b": 581.955, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.663, "r_y0": 581.955, "r_x1": 337.504, "r_y1": 581.955, "r_x2": 337.504, "r_y2": 577.047, "r_x3": 333.663, "r_y3": 577.047, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 340.279, "t": 583.461, "r": 360.07, "b": 588.3779999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.279, "r_y0": 588.369, "r_x1": 360.07, "r_y1": 588.3779999999999, "r_x2": 360.07, "r_y2": 583.47, "r_x3": 340.279, "r_y3": 583.461, "coord_origin": "TOPLEFT"}, "text": "C C NL", "orig": "C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 333.566, "t": 583.419, "r": 337.407, "b": 588.327, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.566, "r_y0": 588.327, "r_x1": 337.407, "r_y1": 588.327, "r_x2": 337.407, "r_y2": 583.419, "r_x3": 333.566, "r_y3": 583.419, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 331.14, "t": 564.345, "r": 333.667, "b": 568.538, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.14, "r_y0": 568.538, "r_x1": 333.667, "r_y1": 568.538, "r_x2": 333.667, "r_y2": 564.345, "r_x3": 331.14, "r_y3": 564.345, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 340.81, "t": 554.648, "r": 343.337, "b": 558.841, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.81, "r_y0": 558.841, "r_x1": 343.337, "r_y1": 558.841, "r_x2": 343.337, "r_y2": 554.648, "r_x3": 340.81, "r_y3": 554.648, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 330.98, "t": 554.885, "r": 333.507, "b": 559.078, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.98, "r_y0": 559.078, "r_x1": 333.507, "r_y1": 559.078, "r_x2": 333.507, "r_y2": 554.885, "r_x3": 330.98, "r_y3": 554.885, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "text", "id": 4, "page_no": 7, "cluster": {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 620.193, "r": 480.592, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.951270341873169, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 628.99, "r_x1": 480.588, "r_y1": 628.99, "r_x2": 480.588, "r_y2": 620.193, "r_x3": 149.709, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.589, "r_y1": 640.9449999999999, "r_x2": 480.589, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.592, "r_y1": 652.9, "r_x2": 480.592, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 155.846, "r_y1": 664.855, "r_x2": 155.846, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.442, "r_y0": 664.855, "r_x1": 480.59, "r_y1": 664.855, "r_x2": 480.59, "r_y2": 656.058, "r_x3": 159.442, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "The predicted OTSL structures were converted back to HTML format in", "orig": "The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for table structure prediction, and Mean Average Precision (mAP) with 0.75 Intersection Over Union (IOU) threshold for the bounding-box predictions of table cells. The predicted OTSL structures were converted back to HTML format in"}], "headers": [{"label": "page_header", "id": 9, "page_no": 7, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 139.372, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8301323056221008, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 139.372, "r_y1": 102.78200000000004, "r_x2": 139.372, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8"}, {"label": "page_header", "id": 8, "page_no": 7, "cluster": {"id": 8, "label": "page_header", "bbox": {"l": 167.813, "t": 91.49300000000005, "r": 231.722, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8631826043128967, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.813, "r_y0": 102.78200000000004, "r_x1": 231.722, "r_y1": 102.78200000000004, "r_x2": 231.722, "r_y2": 91.49300000000005, "r_x3": 167.813, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}]}}, {"page_no": 8, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.594, "r_y1": 127.731, "r_x2": 480.594, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.596, "r_y1": 139.68600000000004, "r_x2": 480.596, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 210.785, "r_y1": 151.64200000000005, "r_x2": 210.785, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 177.99300000000005, "r_x1": 149.402, "r_y1": 177.99300000000005, "r_x2": 149.402, "r_y2": 169.18600000000004, "r_x3": 134.765, "r_y3": 169.18600000000004, "coord_origin": "TOPLEFT"}, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 177.99300000000005, "r_x1": 318.448, "r_y1": 177.99300000000005, "r_x2": 318.448, "r_y2": 169.18600000000004, "r_x3": 160.859, "r_y3": 169.18600000000004, "coord_origin": "TOPLEFT"}, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 194.38300000000004, "r_x1": 480.592, "r_y1": 194.38300000000004, "r_x2": 480.592, "r_y2": 185.586, "r_x3": 134.765, "r_y3": 185.586, "coord_origin": "TOPLEFT"}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 206.33799999999997, "r_x1": 480.592, "r_y1": 206.33799999999997, "r_x2": 480.592, "r_y2": 197.54100000000005, "r_x3": 134.765, "r_y3": 197.54100000000005, "coord_origin": "TOPLEFT"}, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 218.293, "r_x1": 480.592, "r_y1": 218.293, "r_x2": 480.592, "r_y2": 209.49599999999998, "r_x3": 134.765, "r_y3": 209.49599999999998, "coord_origin": "TOPLEFT"}, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 230.24800000000005, "r_x1": 480.593, "r_y1": 230.24800000000005, "r_x2": 480.593, "r_y2": 221.45100000000002, "r_x3": 134.765, "r_y3": 221.45100000000002, "coord_origin": "TOPLEFT"}, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 242.20299999999997, "r_x1": 440.942, "r_y1": 242.20299999999997, "r_x2": 440.942, "r_y2": 233.40599999999995, "r_x3": 134.765, "r_y3": 233.40599999999995, "coord_origin": "TOPLEFT"}, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.868, "r_y0": 242.20299999999997, "r_x1": 480.588, "r_y1": 242.20299999999997, "r_x2": 480.588, "r_y2": 233.40599999999995, "r_x3": 444.868, "r_y3": 233.40599999999995, "coord_origin": "TOPLEFT"}, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 254.159, "r_x1": 145.201, "r_y1": 254.159, "r_x2": 145.201, "r_y2": 245.36199999999997, "r_x3": 134.765, "r_y3": 245.36199999999997, "coord_origin": "TOPLEFT"}, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.149, "r_y0": 254.159, "r_x1": 311.22, "r_y1": 254.159, "r_x2": 311.22, "r_y2": 245.36199999999997, "r_x3": 149.149, "r_y3": 245.36199999999997, "coord_origin": "TOPLEFT"}, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 282.998, "r_x1": 160.118, "r_y1": 282.998, "r_x2": 160.118, "r_y2": 275.072, "r_x3": 134.765, "r_y3": 275.072, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.345, "r_y0": 282.998, "r_x1": 175.595, "r_y1": 282.998, "r_x2": 175.595, "r_y2": 275.072, "r_x3": 167.345, "r_y3": 275.072, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.133, "r_y0": 284.146, "r_x1": 255.736, "r_y1": 284.146, "r_x2": 255.736, "r_y2": 272.85699999999997, "r_x3": 188.133, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "HPO performed", "orig": "HPO performed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.013, "r_y0": 284.146, "r_x1": 269.69, "r_y1": 284.146, "r_x2": 269.69, "r_y2": 272.85699999999997, "r_x3": 262.013, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.957, "r_y0": 284.146, "r_x1": 300.652, "r_y1": 284.146, "r_x2": 300.652, "r_y2": 272.85699999999997, "r_x3": 275.957, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.92, "r_y0": 284.146, "r_x1": 321.763, "r_y1": 284.146, "r_x2": 321.763, "r_y2": 272.85699999999997, "r_x3": 306.92, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.03, "r_y0": 284.146, "r_x1": 419.24, "r_y1": 284.146, "r_x2": 419.24, "r_y2": 272.85699999999997, "r_x3": 328.03, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "HTML representation", "orig": "HTML representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.508, "r_y0": 284.146, "r_x1": 435.233, "r_y1": 284.146, "r_x2": 435.233, "r_y2": 272.85699999999997, "r_x3": 425.508, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.509, "r_y0": 284.146, "r_x1": 454.309, "r_y1": 284.146, "r_x2": 454.309, "r_y2": 272.85699999999997, "r_x3": 441.509, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.576, "r_y0": 284.146, "r_x1": 480.594, "r_y1": 284.146, "r_x2": 480.594, "r_y2": 272.85699999999997, "r_x3": 460.576, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "same", "orig": "same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.105, "r_x1": 480.595, "r_y1": 295.105, "r_x2": 480.595, "r_y2": 283.816, "r_x3": 134.765, "r_y3": 283.816, "coord_origin": "TOPLEFT"}, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 306.064, "r_x1": 480.595, "r_y1": 306.064, "r_x2": 480.595, "r_y2": 294.775, "r_x3": 134.765, "r_y3": 294.775, "coord_origin": "TOPLEFT"}, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 317.023, "r_x1": 163.504, "r_y1": 317.023, "r_x2": 163.504, "r_y2": 305.734, "r_x3": 134.765, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "smaller", "orig": "smaller", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.817, "r_y0": 317.023, "r_x1": 443.264, "r_y1": 317.023, "r_x2": 443.264, "r_y2": 305.734, "r_x3": 167.817, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "models trained on OTSL perform better, especially in recognizing", "orig": "models trained on OTSL perform better, especially in recognizing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.577, "r_y0": 317.023, "r_x1": 480.595, "r_y1": 317.023, "r_x2": 480.595, "r_y2": 305.734, "r_x3": 447.577, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 327.982, "r_x1": 480.595, "r_y1": 327.982, "r_x2": 480.595, "r_y2": 316.693, "r_x3": 134.765, "r_y3": 316.693, "coord_origin": "TOPLEFT"}, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.746, "r_x1": 168.048, "r_y1": 350.746, "r_x2": 168.048, "r_y2": 339.457, "r_x3": 160.37, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 363.697, "r_x1": 183.828, "r_y1": 363.697, "r_x2": 183.828, "r_y2": 352.408, "r_x3": 144.592, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.746, "r_x1": 215.652, "r_y1": 350.746, "r_x2": 215.652, "r_y2": 339.457, "r_x3": 207.974, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 363.697, "r_x1": 231.431, "r_y1": 363.697, "r_x2": 231.431, "r_y2": 352.408, "r_x3": 192.195, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 356.225, "r_x1": 278.318, "r_y1": 356.225, "r_x2": 278.318, "r_y2": 344.936, "r_x3": 239.798, "r_y3": 344.936, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.746, "r_x1": 348.264, "r_y1": 350.746, "r_x2": 348.264, "r_y2": 339.457, "r_x3": 324.67, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.746, "r_x1": 417.127, "r_y1": 350.746, "r_x2": 417.127, "r_y2": 339.457, "r_x3": 396.271, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 361.705, "r_x1": 418.473, "r_y1": 361.705, "r_x2": 418.473, "r_y2": 350.416, "r_x3": 394.927, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.746, "r_x1": 467.142, "r_y1": 350.746, "r_x2": 467.142, "r_y2": 339.457, "r_x3": 430.771, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 361.705, "r_x1": 470.761, "r_y1": 361.705, "r_x2": 470.761, "r_y2": 350.416, "r_x3": 427.148, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 363.697, "r_x1": 312.333, "r_y1": 363.697, "r_x2": 312.333, "r_y2": 352.408, "r_x3": 286.686, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 363.697, "r_x1": 353.72, "r_y1": 363.697, "r_x2": 353.72, "r_y2": 352.408, "r_x3": 320.702, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 363.697, "r_x1": 379.031, "r_y1": 363.697, "r_x2": 379.031, "r_y2": 352.408, "r_x3": 369.306, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 382.527, "r_x1": 166.513, "r_y1": 382.527, "r_x2": 166.513, "r_y2": 371.238, "r_x3": 161.906, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 382.527, "r_x1": 214.116, "r_y1": 382.527, "r_x2": 214.116, "r_y2": 371.238, "r_x3": 209.509, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 377.047, "r_x1": 271.405, "r_y1": 377.047, "r_x2": 271.405, "r_y2": 365.758, "r_x3": 246.71, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 377.047, "r_x1": 310.004, "r_y1": 377.047, "r_x2": 310.004, "r_y2": 365.758, "r_x3": 289.017, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 377.047, "r_x1": 347.704, "r_y1": 377.047, "r_x2": 347.704, "r_y2": 365.758, "r_x3": 326.717, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 377.047, "r_x1": 384.663, "r_y1": 377.047, "r_x2": 384.663, "r_y2": 365.758, "r_x3": 363.676, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 375.899, "r_x1": 416.127, "r_y1": 375.899, "r_x2": 416.127, "r_y2": 367.973, "r_x3": 397.27, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 375.899, "r_x1": 458.384, "r_y1": 375.899, "r_x2": 458.384, "r_y2": 367.973, "r_x3": 439.527, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.999, "r_x1": 272.94, "r_y1": 389.999, "r_x2": 272.94, "r_y2": 378.71, "r_x3": 245.176, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.999, "r_x1": 310.004, "r_y1": 389.999, "r_x2": 310.004, "r_y2": 378.71, "r_x3": 289.017, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.999, "r_x1": 347.704, "r_y1": 389.999, "r_x2": 347.704, "r_y2": 378.71, "r_x3": 326.717, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.999, "r_x1": 384.663, "r_y1": 389.999, "r_x2": 384.663, "r_y2": 378.71, "r_x3": 363.676, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.999, "r_x1": 417.193, "r_y1": 389.999, "r_x2": 417.193, "r_y2": 378.71, "r_x3": 396.206, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.999, "r_x1": 457.147, "r_y1": 389.999, "r_x2": 457.147, "r_y2": 378.71, "r_x3": 440.767, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.828, "r_x1": 166.513, "r_y1": 408.828, "r_x2": 166.513, "r_y2": 397.539, "r_x3": 161.906, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.828, "r_x1": 214.116, "r_y1": 408.828, "r_x2": 214.116, "r_y2": 397.539, "r_x3": 209.509, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 403.349, "r_x1": 271.405, "r_y1": 403.349, "r_x2": 271.405, "r_y2": 392.06, "r_x3": 246.71, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 403.349, "r_x1": 310.004, "r_y1": 403.349, "r_x2": 310.004, "r_y2": 392.06, "r_x3": 289.017, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 403.349, "r_x1": 347.704, "r_y1": 403.349, "r_x2": 347.704, "r_y2": 392.06, "r_x3": 326.717, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 403.349, "r_x1": 384.663, "r_y1": 403.349, "r_x2": 384.663, "r_y2": 392.06, "r_x3": 363.676, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 402.201, "r_x1": 418.779, "r_y1": 402.201, "r_x2": 418.779, "r_y2": 394.275, "r_x3": 394.618, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 402.201, "r_x1": 458.384, "r_y1": 402.201, "r_x2": 458.384, "r_y2": 394.275, "r_x3": 439.527, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 416.3, "r_x1": 272.94, "r_y1": 416.3, "r_x2": 272.94, "r_y2": 405.011, "r_x3": 245.176, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 416.3, "r_x1": 310.004, "r_y1": 416.3, "r_x2": 310.004, "r_y2": 405.011, "r_x3": 289.017, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 416.3, "r_x1": 347.704, "r_y1": 416.3, "r_x2": 347.704, "r_y2": 405.011, "r_x3": 326.717, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 415.152, "r_x1": 386.249, "r_y1": 415.152, "r_x2": 386.249, "r_y2": 407.226, "r_x3": 362.088, "r_y3": 407.226, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 416.3, "r_x1": 417.193, "r_y1": 416.3, "r_x2": 417.193, "r_y2": 405.011, "r_x3": 396.206, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 416.3, "r_x1": 457.147, "r_y1": 416.3, "r_x2": 457.147, "r_y2": 405.011, "r_x3": 440.767, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 435.129, "r_x1": 166.513, "r_y1": 435.129, "r_x2": 166.513, "r_y2": 423.84, "r_x3": 161.906, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 435.129, "r_x1": 214.116, "r_y1": 435.129, "r_x2": 214.116, "r_y2": 423.84, "r_x3": 209.509, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 429.65, "r_x1": 271.405, "r_y1": 429.65, "r_x2": 271.405, "r_y2": 418.361, "r_x3": 246.71, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 429.65, "r_x1": 310.004, "r_y1": 429.65, "r_x2": 310.004, "r_y2": 418.361, "r_x3": 289.017, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 429.65, "r_x1": 347.704, "r_y1": 429.65, "r_x2": 347.704, "r_y2": 418.361, "r_x3": 326.717, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 429.65, "r_x1": 384.663, "r_y1": 429.65, "r_x2": 384.663, "r_y2": 418.361, "r_x3": 363.676, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 428.502, "r_x1": 418.779, "r_y1": 428.502, "r_x2": 418.779, "r_y2": 420.576, "r_x3": 394.618, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 428.502, "r_x1": 458.384, "r_y1": 428.502, "r_x2": 458.384, "r_y2": 420.576, "r_x3": 439.527, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 442.601, "r_x1": 272.94, "r_y1": 442.601, "r_x2": 272.94, "r_y2": 431.312, "r_x3": 245.176, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 442.601, "r_x1": 310.004, "r_y1": 442.601, "r_x2": 310.004, "r_y2": 431.312, "r_x3": 289.017, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 442.601, "r_x1": 347.704, "r_y1": 442.601, "r_x2": 347.704, "r_y2": 431.312, "r_x3": 326.717, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 441.453, "r_x1": 386.249, "r_y1": 441.453, "r_x2": 386.249, "r_y2": 433.527, "r_x3": 362.088, "r_y3": 433.527, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 442.601, "r_x1": 417.193, "r_y1": 442.601, "r_x2": 417.193, "r_y2": 431.312, "r_x3": 396.206, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 442.601, "r_x1": 457.147, "r_y1": 442.601, "r_x2": 457.147, "r_y2": 431.312, "r_x3": 440.767, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 461.431, "r_x1": 166.513, "r_y1": 461.431, "r_x2": 166.513, "r_y2": 450.142, "r_x3": 161.906, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 461.431, "r_x1": 214.116, "r_y1": 461.431, "r_x2": 214.116, "r_y2": 450.142, "r_x3": 209.509, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.951, "r_x1": 271.405, "r_y1": 455.951, "r_x2": 271.405, "r_y2": 444.662, "r_x3": 246.71, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.951, "r_x1": 310.004, "r_y1": 455.951, "r_x2": 310.004, "r_y2": 444.662, "r_x3": 289.017, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.951, "r_x1": 345.401, "r_y1": 455.951, "r_x2": 345.401, "r_y2": 444.662, "r_x3": 329.021, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 454.803, "r_x1": 386.249, "r_y1": 454.803, "r_x2": 386.249, "r_y2": 446.877, "r_x3": 362.088, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 454.803, "r_x1": 418.779, "r_y1": 454.803, "r_x2": 418.779, "r_y2": 446.877, "r_x3": 394.618, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 454.803, "r_x1": 458.384, "r_y1": 454.803, "r_x2": 458.384, "r_y2": 446.877, "r_x3": 439.527, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.903, "r_x1": 272.94, "r_y1": 468.903, "r_x2": 272.94, "r_y2": 457.614, "r_x3": 245.176, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.903, "r_x1": 310.004, "r_y1": 468.903, "r_x2": 310.004, "r_y2": 457.614, "r_x3": 289.017, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.903, "r_x1": 347.704, "r_y1": 468.903, "r_x2": 347.704, "r_y2": 457.614, "r_x3": 326.717, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.903, "r_x1": 384.663, "r_y1": 468.903, "r_x2": 384.663, "r_y2": 457.614, "r_x3": 363.676, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.903, "r_x1": 417.193, "r_y1": 468.903, "r_x2": 417.193, "r_y2": 457.614, "r_x3": 396.206, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.903, "r_x1": 451.26, "r_y1": 468.903, "r_x2": 451.26, "r_y2": 457.614, "r_x3": 446.653, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 516.9590000000001, "r_x1": 149.402, "r_y1": 516.9590000000001, "r_x2": 149.402, "r_y2": 508.152, "r_x3": 134.765, "r_y3": 508.152, "coord_origin": "TOPLEFT"}, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 516.9590000000001, "r_x1": 264.403, "r_y1": 516.9590000000001, "r_x2": 264.403, "r_y2": 508.152, "r_x3": 160.859, "r_y3": 508.152, "coord_origin": "TOPLEFT"}, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.348, "r_x1": 480.591, "r_y1": 533.348, "r_x2": 480.591, "r_y2": 524.5509999999999, "r_x3": 134.765, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 164.921, "r_y1": 545.304, "r_x2": 164.921, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "quality", "orig": "quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.324, "r_y0": 545.304, "r_x1": 480.587, "r_y1": 545.304, "r_x2": 480.587, "r_y2": 536.5070000000001, "r_x3": 169.324, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.596, "r_y1": 557.259, "r_x2": 480.596, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 480.592, "r_y1": 569.2139999999999, "r_x2": 480.592, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 480.591, "r_y1": 581.169, "r_x2": 480.591, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.596, "r_y1": 593.124, "r_x2": 480.596, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.588, "r_y1": 605.08, "r_x2": 480.588, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 206.787, "r_y1": 617.035, "r_x2": 206.787, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 628.99, "r_x1": 205.597, "r_y1": 628.99, "r_x2": 205.597, "r_y2": 620.193, "r_x3": 149.709, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.578, "r_y0": 628.99, "r_x1": 224.412, "r_y1": 628.99, "r_x2": 224.412, "r_y2": 620.193, "r_x3": 210.578, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.383, "r_y0": 628.99, "r_x1": 257.74, "r_y1": 628.99, "r_x2": 257.74, "r_y2": 620.193, "r_x3": 229.383, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "results", "orig": "results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.722, "r_y0": 628.99, "r_x1": 307.319, "r_y1": 628.99, "r_x2": 307.319, "r_y2": 620.193, "r_x3": 262.722, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "show that", "orig": "show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.301, "r_y0": 628.99, "r_x1": 480.593, "r_y1": 628.99, "r_x2": 480.593, "r_y2": 620.193, "r_x3": 312.301, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "OTSL has an advantage over HTML", "orig": "OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.596, "r_y1": 640.9449999999999, "r_x2": 480.596, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.593, "r_y1": 652.9, "r_x2": 480.593, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 405.797, "r_y1": 664.855, "r_x2": 405.797, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 8, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9373378753662109, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8857625722885132, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.596, "b": 151.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9805440306663513, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.594, "r_y1": 127.731, "r_x2": 480.594, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.596, "r_y1": 139.68600000000004, "r_x2": 480.596, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 210.785, "r_y1": 151.64200000000005, "r_x2": 210.785, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "section_header", "bbox": {"l": 134.765, "t": 169.18600000000004, "r": 318.448, "b": 177.99300000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9579681158065796, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 177.99300000000005, "r_x1": 149.402, "r_y1": 177.99300000000005, "r_x2": 149.402, "r_y2": 169.18600000000004, "r_x3": 134.765, "r_y3": 169.18600000000004, "coord_origin": "TOPLEFT"}, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 177.99300000000005, "r_x1": 318.448, "r_y1": 177.99300000000005, "r_x2": 318.448, "r_y2": 169.18600000000004, "r_x3": 160.859, "r_y3": 169.18600000000004, "coord_origin": "TOPLEFT"}, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 185.586, "r": 480.593, "b": 254.159, "coord_origin": "TOPLEFT"}, "confidence": 0.9842326641082764, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 194.38300000000004, "r_x1": 480.592, "r_y1": 194.38300000000004, "r_x2": 480.592, "r_y2": 185.586, "r_x3": 134.765, "r_y3": 185.586, "coord_origin": "TOPLEFT"}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 206.33799999999997, "r_x1": 480.592, "r_y1": 206.33799999999997, "r_x2": 480.592, "r_y2": 197.54100000000005, "r_x3": 134.765, "r_y3": 197.54100000000005, "coord_origin": "TOPLEFT"}, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 218.293, "r_x1": 480.592, "r_y1": 218.293, "r_x2": 480.592, "r_y2": 209.49599999999998, "r_x3": 134.765, "r_y3": 209.49599999999998, "coord_origin": "TOPLEFT"}, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 230.24800000000005, "r_x1": 480.593, "r_y1": 230.24800000000005, "r_x2": 480.593, "r_y2": 221.45100000000002, "r_x3": 134.765, "r_y3": 221.45100000000002, "coord_origin": "TOPLEFT"}, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 242.20299999999997, "r_x1": 440.942, "r_y1": 242.20299999999997, "r_x2": 440.942, "r_y2": 233.40599999999995, "r_x3": 134.765, "r_y3": 233.40599999999995, "coord_origin": "TOPLEFT"}, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.868, "r_y0": 242.20299999999997, "r_x1": 480.588, "r_y1": 242.20299999999997, "r_x2": 480.588, "r_y2": 233.40599999999995, "r_x3": 444.868, "r_y3": 233.40599999999995, "coord_origin": "TOPLEFT"}, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 254.159, "r_x1": 145.201, "r_y1": 254.159, "r_x2": 145.201, "r_y2": 245.36199999999997, "r_x3": 134.765, "r_y3": 245.36199999999997, "coord_origin": "TOPLEFT"}, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.149, "r_y0": 254.159, "r_x1": 311.22, "r_y1": 254.159, "r_x2": 311.22, "r_y2": 245.36199999999997, "r_x3": 149.149, "r_y3": 245.36199999999997, "coord_origin": "TOPLEFT"}, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "caption", "bbox": {"l": 134.765, "t": 272.85699999999997, "r": 480.595, "b": 327.982, "coord_origin": "TOPLEFT"}, "confidence": 0.9570781588554382, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 282.998, "r_x1": 160.118, "r_y1": 282.998, "r_x2": 160.118, "r_y2": 275.072, "r_x3": 134.765, "r_y3": 275.072, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.345, "r_y0": 282.998, "r_x1": 175.595, "r_y1": 282.998, "r_x2": 175.595, "r_y2": 275.072, "r_x3": 167.345, "r_y3": 275.072, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.133, "r_y0": 284.146, "r_x1": 255.736, "r_y1": 284.146, "r_x2": 255.736, "r_y2": 272.85699999999997, "r_x3": 188.133, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "HPO performed", "orig": "HPO performed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.013, "r_y0": 284.146, "r_x1": 269.69, "r_y1": 284.146, "r_x2": 269.69, "r_y2": 272.85699999999997, "r_x3": 262.013, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.957, "r_y0": 284.146, "r_x1": 300.652, "r_y1": 284.146, "r_x2": 300.652, "r_y2": 272.85699999999997, "r_x3": 275.957, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.92, "r_y0": 284.146, "r_x1": 321.763, "r_y1": 284.146, "r_x2": 321.763, "r_y2": 272.85699999999997, "r_x3": 306.92, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.03, "r_y0": 284.146, "r_x1": 419.24, "r_y1": 284.146, "r_x2": 419.24, "r_y2": 272.85699999999997, "r_x3": 328.03, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "HTML representation", "orig": "HTML representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.508, "r_y0": 284.146, "r_x1": 435.233, "r_y1": 284.146, "r_x2": 435.233, "r_y2": 272.85699999999997, "r_x3": 425.508, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.509, "r_y0": 284.146, "r_x1": 454.309, "r_y1": 284.146, "r_x2": 454.309, "r_y2": 272.85699999999997, "r_x3": 441.509, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.576, "r_y0": 284.146, "r_x1": 480.594, "r_y1": 284.146, "r_x2": 480.594, "r_y2": 272.85699999999997, "r_x3": 460.576, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "same", "orig": "same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.105, "r_x1": 480.595, "r_y1": 295.105, "r_x2": 480.595, "r_y2": 283.816, "r_x3": 134.765, "r_y3": 283.816, "coord_origin": "TOPLEFT"}, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 306.064, "r_x1": 480.595, "r_y1": 306.064, "r_x2": 480.595, "r_y2": 294.775, "r_x3": 134.765, "r_y3": 294.775, "coord_origin": "TOPLEFT"}, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 317.023, "r_x1": 163.504, "r_y1": 317.023, "r_x2": 163.504, "r_y2": 305.734, "r_x3": 134.765, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "smaller", "orig": "smaller", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.817, "r_y0": 317.023, "r_x1": 443.264, "r_y1": 317.023, "r_x2": 443.264, "r_y2": 305.734, "r_x3": 167.817, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "models trained on OTSL perform better, especially in recognizing", "orig": "models trained on OTSL perform better, especially in recognizing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.577, "r_y0": 317.023, "r_x1": 480.595, "r_y1": 317.023, "r_x2": 480.595, "r_y2": 305.734, "r_x3": 447.577, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 327.982, "r_x1": 480.595, "r_y1": 327.982, "r_x2": 480.595, "r_y2": 316.693, "r_x3": 134.765, "r_y3": 316.693, "coord_origin": "TOPLEFT"}, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "table", "bbox": {"l": 139.66845703125, "t": 337.5747985839844, "r": 475.00372314453125, "b": 469.4721374511719, "coord_origin": "TOPLEFT"}, "confidence": 0.9901032447814941, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.746, "r_x1": 168.048, "r_y1": 350.746, "r_x2": 168.048, "r_y2": 339.457, "r_x3": 160.37, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 363.697, "r_x1": 183.828, "r_y1": 363.697, "r_x2": 183.828, "r_y2": 352.408, "r_x3": 144.592, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.746, "r_x1": 215.652, "r_y1": 350.746, "r_x2": 215.652, "r_y2": 339.457, "r_x3": 207.974, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 363.697, "r_x1": 231.431, "r_y1": 363.697, "r_x2": 231.431, "r_y2": 352.408, "r_x3": 192.195, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 356.225, "r_x1": 278.318, "r_y1": 356.225, "r_x2": 278.318, "r_y2": 344.936, "r_x3": 239.798, "r_y3": 344.936, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.746, "r_x1": 348.264, "r_y1": 350.746, "r_x2": 348.264, "r_y2": 339.457, "r_x3": 324.67, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.746, "r_x1": 417.127, "r_y1": 350.746, "r_x2": 417.127, "r_y2": 339.457, "r_x3": 396.271, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 361.705, "r_x1": 418.473, "r_y1": 361.705, "r_x2": 418.473, "r_y2": 350.416, "r_x3": 394.927, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.746, "r_x1": 467.142, "r_y1": 350.746, "r_x2": 467.142, "r_y2": 339.457, "r_x3": 430.771, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 361.705, "r_x1": 470.761, "r_y1": 361.705, "r_x2": 470.761, "r_y2": 350.416, "r_x3": 427.148, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 363.697, "r_x1": 312.333, "r_y1": 363.697, "r_x2": 312.333, "r_y2": 352.408, "r_x3": 286.686, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 363.697, "r_x1": 353.72, "r_y1": 363.697, "r_x2": 353.72, "r_y2": 352.408, "r_x3": 320.702, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 363.697, "r_x1": 379.031, "r_y1": 363.697, "r_x2": 379.031, "r_y2": 352.408, "r_x3": 369.306, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 382.527, "r_x1": 166.513, "r_y1": 382.527, "r_x2": 166.513, "r_y2": 371.238, "r_x3": 161.906, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 382.527, "r_x1": 214.116, "r_y1": 382.527, "r_x2": 214.116, "r_y2": 371.238, "r_x3": 209.509, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 377.047, "r_x1": 271.405, "r_y1": 377.047, "r_x2": 271.405, "r_y2": 365.758, "r_x3": 246.71, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 377.047, "r_x1": 310.004, "r_y1": 377.047, "r_x2": 310.004, "r_y2": 365.758, "r_x3": 289.017, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 377.047, "r_x1": 347.704, "r_y1": 377.047, "r_x2": 347.704, "r_y2": 365.758, "r_x3": 326.717, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 377.047, "r_x1": 384.663, "r_y1": 377.047, "r_x2": 384.663, "r_y2": 365.758, "r_x3": 363.676, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 375.899, "r_x1": 416.127, "r_y1": 375.899, "r_x2": 416.127, "r_y2": 367.973, "r_x3": 397.27, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 375.899, "r_x1": 458.384, "r_y1": 375.899, "r_x2": 458.384, "r_y2": 367.973, "r_x3": 439.527, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.999, "r_x1": 272.94, "r_y1": 389.999, "r_x2": 272.94, "r_y2": 378.71, "r_x3": 245.176, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.999, "r_x1": 310.004, "r_y1": 389.999, "r_x2": 310.004, "r_y2": 378.71, "r_x3": 289.017, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.999, "r_x1": 347.704, "r_y1": 389.999, "r_x2": 347.704, "r_y2": 378.71, "r_x3": 326.717, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.999, "r_x1": 384.663, "r_y1": 389.999, "r_x2": 384.663, "r_y2": 378.71, "r_x3": 363.676, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.999, "r_x1": 417.193, "r_y1": 389.999, "r_x2": 417.193, "r_y2": 378.71, "r_x3": 396.206, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.999, "r_x1": 457.147, "r_y1": 389.999, "r_x2": 457.147, "r_y2": 378.71, "r_x3": 440.767, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.828, "r_x1": 166.513, "r_y1": 408.828, "r_x2": 166.513, "r_y2": 397.539, "r_x3": 161.906, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.828, "r_x1": 214.116, "r_y1": 408.828, "r_x2": 214.116, "r_y2": 397.539, "r_x3": 209.509, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 403.349, "r_x1": 271.405, "r_y1": 403.349, "r_x2": 271.405, "r_y2": 392.06, "r_x3": 246.71, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 403.349, "r_x1": 310.004, "r_y1": 403.349, "r_x2": 310.004, "r_y2": 392.06, "r_x3": 289.017, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 403.349, "r_x1": 347.704, "r_y1": 403.349, "r_x2": 347.704, "r_y2": 392.06, "r_x3": 326.717, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 403.349, "r_x1": 384.663, "r_y1": 403.349, "r_x2": 384.663, "r_y2": 392.06, "r_x3": 363.676, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 402.201, "r_x1": 418.779, "r_y1": 402.201, "r_x2": 418.779, "r_y2": 394.275, "r_x3": 394.618, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 402.201, "r_x1": 458.384, "r_y1": 402.201, "r_x2": 458.384, "r_y2": 394.275, "r_x3": 439.527, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 416.3, "r_x1": 272.94, "r_y1": 416.3, "r_x2": 272.94, "r_y2": 405.011, "r_x3": 245.176, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 416.3, "r_x1": 310.004, "r_y1": 416.3, "r_x2": 310.004, "r_y2": 405.011, "r_x3": 289.017, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 416.3, "r_x1": 347.704, "r_y1": 416.3, "r_x2": 347.704, "r_y2": 405.011, "r_x3": 326.717, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 415.152, "r_x1": 386.249, "r_y1": 415.152, "r_x2": 386.249, "r_y2": 407.226, "r_x3": 362.088, "r_y3": 407.226, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 416.3, "r_x1": 417.193, "r_y1": 416.3, "r_x2": 417.193, "r_y2": 405.011, "r_x3": 396.206, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 416.3, "r_x1": 457.147, "r_y1": 416.3, "r_x2": 457.147, "r_y2": 405.011, "r_x3": 440.767, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 435.129, "r_x1": 166.513, "r_y1": 435.129, "r_x2": 166.513, "r_y2": 423.84, "r_x3": 161.906, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 435.129, "r_x1": 214.116, "r_y1": 435.129, "r_x2": 214.116, "r_y2": 423.84, "r_x3": 209.509, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 429.65, "r_x1": 271.405, "r_y1": 429.65, "r_x2": 271.405, "r_y2": 418.361, "r_x3": 246.71, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 429.65, "r_x1": 310.004, "r_y1": 429.65, "r_x2": 310.004, "r_y2": 418.361, "r_x3": 289.017, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 429.65, "r_x1": 347.704, "r_y1": 429.65, "r_x2": 347.704, "r_y2": 418.361, "r_x3": 326.717, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 429.65, "r_x1": 384.663, "r_y1": 429.65, "r_x2": 384.663, "r_y2": 418.361, "r_x3": 363.676, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 428.502, "r_x1": 418.779, "r_y1": 428.502, "r_x2": 418.779, "r_y2": 420.576, "r_x3": 394.618, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 428.502, "r_x1": 458.384, "r_y1": 428.502, "r_x2": 458.384, "r_y2": 420.576, "r_x3": 439.527, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 442.601, "r_x1": 272.94, "r_y1": 442.601, "r_x2": 272.94, "r_y2": 431.312, "r_x3": 245.176, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 442.601, "r_x1": 310.004, "r_y1": 442.601, "r_x2": 310.004, "r_y2": 431.312, "r_x3": 289.017, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 442.601, "r_x1": 347.704, "r_y1": 442.601, "r_x2": 347.704, "r_y2": 431.312, "r_x3": 326.717, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 441.453, "r_x1": 386.249, "r_y1": 441.453, "r_x2": 386.249, "r_y2": 433.527, "r_x3": 362.088, "r_y3": 433.527, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 442.601, "r_x1": 417.193, "r_y1": 442.601, "r_x2": 417.193, "r_y2": 431.312, "r_x3": 396.206, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 442.601, "r_x1": 457.147, "r_y1": 442.601, "r_x2": 457.147, "r_y2": 431.312, "r_x3": 440.767, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 461.431, "r_x1": 166.513, "r_y1": 461.431, "r_x2": 166.513, "r_y2": 450.142, "r_x3": 161.906, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 461.431, "r_x1": 214.116, "r_y1": 461.431, "r_x2": 214.116, "r_y2": 450.142, "r_x3": 209.509, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.951, "r_x1": 271.405, "r_y1": 455.951, "r_x2": 271.405, "r_y2": 444.662, "r_x3": 246.71, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.951, "r_x1": 310.004, "r_y1": 455.951, "r_x2": 310.004, "r_y2": 444.662, "r_x3": 289.017, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.951, "r_x1": 345.401, "r_y1": 455.951, "r_x2": 345.401, "r_y2": 444.662, "r_x3": 329.021, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 454.803, "r_x1": 386.249, "r_y1": 454.803, "r_x2": 386.249, "r_y2": 446.877, "r_x3": 362.088, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 454.803, "r_x1": 418.779, "r_y1": 454.803, "r_x2": 418.779, "r_y2": 446.877, "r_x3": 394.618, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 454.803, "r_x1": 458.384, "r_y1": 454.803, "r_x2": 458.384, "r_y2": 446.877, "r_x3": 439.527, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.903, "r_x1": 272.94, "r_y1": 468.903, "r_x2": 272.94, "r_y2": 457.614, "r_x3": 245.176, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.903, "r_x1": 310.004, "r_y1": 468.903, "r_x2": 310.004, "r_y2": 457.614, "r_x3": 289.017, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.903, "r_x1": 347.704, "r_y1": 468.903, "r_x2": 347.704, "r_y2": 457.614, "r_x3": 326.717, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.903, "r_x1": 384.663, "r_y1": 468.903, "r_x2": 384.663, "r_y2": 457.614, "r_x3": 363.676, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.903, "r_x1": 417.193, "r_y1": 468.903, "r_x2": 417.193, "r_y2": 457.614, "r_x3": 396.206, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.903, "r_x1": 451.26, "r_y1": 468.903, "r_x2": 451.26, "r_y2": 457.614, "r_x3": 446.653, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 160.37, "t": 339.457, "r": 168.048, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.746, "r_x1": 168.048, "r_y1": 350.746, "r_x2": 168.048, "r_y2": 339.457, "r_x3": 160.37, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 144.592, "t": 352.408, "r": 183.828, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 363.697, "r_x1": 183.828, "r_y1": 363.697, "r_x2": 183.828, "r_y2": 352.408, "r_x3": 144.592, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 207.974, "t": 339.457, "r": 215.652, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.746, "r_x1": 215.652, "r_y1": 350.746, "r_x2": 215.652, "r_y2": 339.457, "r_x3": 207.974, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 192.195, "t": 352.408, "r": 231.431, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 363.697, "r_x1": 231.431, "r_y1": 363.697, "r_x2": 231.431, "r_y2": 352.408, "r_x3": 192.195, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 239.798, "t": 344.936, "r": 278.318, "b": 356.225, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 356.225, "r_x1": 278.318, "r_y1": 356.225, "r_x2": 278.318, "r_y2": 344.936, "r_x3": 239.798, "r_y3": 344.936, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 324.67, "t": 339.457, "r": 348.264, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.746, "r_x1": 348.264, "r_y1": 350.746, "r_x2": 348.264, "r_y2": 339.457, "r_x3": 324.67, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 396.271, "t": 339.457, "r": 417.127, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.746, "r_x1": 417.127, "r_y1": 350.746, "r_x2": 417.127, "r_y2": 339.457, "r_x3": 396.271, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 394.927, "t": 350.416, "r": 418.473, "b": 361.705, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 361.705, "r_x1": 418.473, "r_y1": 361.705, "r_x2": 418.473, "r_y2": 350.416, "r_x3": 394.927, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 430.771, "t": 339.457, "r": 467.142, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.746, "r_x1": 467.142, "r_y1": 350.746, "r_x2": 467.142, "r_y2": 339.457, "r_x3": 430.771, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 427.148, "t": 350.416, "r": 470.761, "b": 361.705, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 361.705, "r_x1": 470.761, "r_y1": 361.705, "r_x2": 470.761, "r_y2": 350.416, "r_x3": 427.148, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 286.686, "t": 352.408, "r": 312.333, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 363.697, "r_x1": 312.333, "r_y1": 363.697, "r_x2": 312.333, "r_y2": 352.408, "r_x3": 286.686, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 320.702, "t": 352.408, "r": 353.72, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 363.697, "r_x1": 353.72, "r_y1": 363.697, "r_x2": 353.72, "r_y2": 352.408, "r_x3": 320.702, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 369.306, "t": 352.408, "r": 379.031, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 363.697, "r_x1": 379.031, "r_y1": 363.697, "r_x2": 379.031, "r_y2": 352.408, "r_x3": 369.306, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 161.906, "t": 371.238, "r": 166.513, "b": 382.527, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 382.527, "r_x1": 166.513, "r_y1": 382.527, "r_x2": 166.513, "r_y2": 371.238, "r_x3": 161.906, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 209.509, "t": 371.238, "r": 214.116, "b": 382.527, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 382.527, "r_x1": 214.116, "r_y1": 382.527, "r_x2": 214.116, "r_y2": 371.238, "r_x3": 209.509, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 246.71, "t": 365.758, "r": 271.405, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 377.047, "r_x1": 271.405, "r_y1": 377.047, "r_x2": 271.405, "r_y2": 365.758, "r_x3": 246.71, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 289.017, "t": 365.758, "r": 310.004, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 377.047, "r_x1": 310.004, "r_y1": 377.047, "r_x2": 310.004, "r_y2": 365.758, "r_x3": 289.017, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 326.717, "t": 365.758, "r": 347.704, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 377.047, "r_x1": 347.704, "r_y1": 377.047, "r_x2": 347.704, "r_y2": 365.758, "r_x3": 326.717, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 363.676, "t": 365.758, "r": 384.663, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 377.047, "r_x1": 384.663, "r_y1": 377.047, "r_x2": 384.663, "r_y2": 365.758, "r_x3": 363.676, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 397.27, "t": 367.973, "r": 416.127, "b": 375.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 375.899, "r_x1": 416.127, "r_y1": 375.899, "r_x2": 416.127, "r_y2": 367.973, "r_x3": 397.27, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 439.527, "t": 367.973, "r": 458.384, "b": 375.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 375.899, "r_x1": 458.384, "r_y1": 375.899, "r_x2": 458.384, "r_y2": 367.973, "r_x3": 439.527, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 245.176, "t": 378.71, "r": 272.94, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.999, "r_x1": 272.94, "r_y1": 389.999, "r_x2": 272.94, "r_y2": 378.71, "r_x3": 245.176, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 289.017, "t": 378.71, "r": 310.004, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.999, "r_x1": 310.004, "r_y1": 389.999, "r_x2": 310.004, "r_y2": 378.71, "r_x3": 289.017, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 326.717, "t": 378.71, "r": 347.704, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.999, "r_x1": 347.704, "r_y1": 389.999, "r_x2": 347.704, "r_y2": 378.71, "r_x3": 326.717, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 363.676, "t": 378.71, "r": 384.663, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.999, "r_x1": 384.663, "r_y1": 389.999, "r_x2": 384.663, "r_y2": 378.71, "r_x3": 363.676, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 396.206, "t": 378.71, "r": 417.193, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.999, "r_x1": 417.193, "r_y1": 389.999, "r_x2": 417.193, "r_y2": 378.71, "r_x3": 396.206, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 440.767, "t": 378.71, "r": 457.147, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.999, "r_x1": 457.147, "r_y1": 389.999, "r_x2": 457.147, "r_y2": 378.71, "r_x3": 440.767, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 161.906, "t": 397.539, "r": 166.513, "b": 408.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.828, "r_x1": 166.513, "r_y1": 408.828, "r_x2": 166.513, "r_y2": 397.539, "r_x3": 161.906, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 209.509, "t": 397.539, "r": 214.116, "b": 408.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.828, "r_x1": 214.116, "r_y1": 408.828, "r_x2": 214.116, "r_y2": 397.539, "r_x3": 209.509, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 246.71, "t": 392.06, "r": 271.405, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 403.349, "r_x1": 271.405, "r_y1": 403.349, "r_x2": 271.405, "r_y2": 392.06, "r_x3": 246.71, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 289.017, "t": 392.06, "r": 310.004, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 403.349, "r_x1": 310.004, "r_y1": 403.349, "r_x2": 310.004, "r_y2": 392.06, "r_x3": 289.017, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 326.717, "t": 392.06, "r": 347.704, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 403.349, "r_x1": 347.704, "r_y1": 403.349, "r_x2": 347.704, "r_y2": 392.06, "r_x3": 326.717, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 363.676, "t": 392.06, "r": 384.663, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 403.349, "r_x1": 384.663, "r_y1": 403.349, "r_x2": 384.663, "r_y2": 392.06, "r_x3": 363.676, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 394.618, "t": 394.275, "r": 418.779, "b": 402.201, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 402.201, "r_x1": 418.779, "r_y1": 402.201, "r_x2": 418.779, "r_y2": 394.275, "r_x3": 394.618, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 439.527, "t": 394.275, "r": 458.384, "b": 402.201, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 402.201, "r_x1": 458.384, "r_y1": 402.201, "r_x2": 458.384, "r_y2": 394.275, "r_x3": 439.527, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 245.176, "t": 405.011, "r": 272.94, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 416.3, "r_x1": 272.94, "r_y1": 416.3, "r_x2": 272.94, "r_y2": 405.011, "r_x3": 245.176, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 289.017, "t": 405.011, "r": 310.004, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 416.3, "r_x1": 310.004, "r_y1": 416.3, "r_x2": 310.004, "r_y2": 405.011, "r_x3": 289.017, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 326.717, "t": 405.011, "r": 347.704, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 416.3, "r_x1": 347.704, "r_y1": 416.3, "r_x2": 347.704, "r_y2": 405.011, "r_x3": 326.717, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 362.088, "t": 407.226, "r": 386.249, "b": 415.152, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 415.152, "r_x1": 386.249, "r_y1": 415.152, "r_x2": 386.249, "r_y2": 407.226, "r_x3": 362.088, "r_y3": 407.226, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 396.206, "t": 405.011, "r": 417.193, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 416.3, "r_x1": 417.193, "r_y1": 416.3, "r_x2": 417.193, "r_y2": 405.011, "r_x3": 396.206, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 440.767, "t": 405.011, "r": 457.147, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 416.3, "r_x1": 457.147, "r_y1": 416.3, "r_x2": 457.147, "r_y2": 405.011, "r_x3": 440.767, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 161.906, "t": 423.84, "r": 166.513, "b": 435.129, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 435.129, "r_x1": 166.513, "r_y1": 435.129, "r_x2": 166.513, "r_y2": 423.84, "r_x3": 161.906, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 209.509, "t": 423.84, "r": 214.116, "b": 435.129, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 435.129, "r_x1": 214.116, "r_y1": 435.129, "r_x2": 214.116, "r_y2": 423.84, "r_x3": 209.509, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 246.71, "t": 418.361, "r": 271.405, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 429.65, "r_x1": 271.405, "r_y1": 429.65, "r_x2": 271.405, "r_y2": 418.361, "r_x3": 246.71, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 289.017, "t": 418.361, "r": 310.004, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 429.65, "r_x1": 310.004, "r_y1": 429.65, "r_x2": 310.004, "r_y2": 418.361, "r_x3": 289.017, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 326.717, "t": 418.361, "r": 347.704, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 429.65, "r_x1": 347.704, "r_y1": 429.65, "r_x2": 347.704, "r_y2": 418.361, "r_x3": 326.717, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 363.676, "t": 418.361, "r": 384.663, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 429.65, "r_x1": 384.663, "r_y1": 429.65, "r_x2": 384.663, "r_y2": 418.361, "r_x3": 363.676, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 394.618, "t": 420.576, "r": 418.779, "b": 428.502, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 428.502, "r_x1": 418.779, "r_y1": 428.502, "r_x2": 418.779, "r_y2": 420.576, "r_x3": 394.618, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 439.527, "t": 420.576, "r": 458.384, "b": 428.502, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 428.502, "r_x1": 458.384, "r_y1": 428.502, "r_x2": 458.384, "r_y2": 420.576, "r_x3": 439.527, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 245.176, "t": 431.312, "r": 272.94, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 442.601, "r_x1": 272.94, "r_y1": 442.601, "r_x2": 272.94, "r_y2": 431.312, "r_x3": 245.176, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 289.017, "t": 431.312, "r": 310.004, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 442.601, "r_x1": 310.004, "r_y1": 442.601, "r_x2": 310.004, "r_y2": 431.312, "r_x3": 289.017, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 326.717, "t": 431.312, "r": 347.704, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 442.601, "r_x1": 347.704, "r_y1": 442.601, "r_x2": 347.704, "r_y2": 431.312, "r_x3": 326.717, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 362.088, "t": 433.527, "r": 386.249, "b": 441.453, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 441.453, "r_x1": 386.249, "r_y1": 441.453, "r_x2": 386.249, "r_y2": 433.527, "r_x3": 362.088, "r_y3": 433.527, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 396.206, "t": 431.312, "r": 417.193, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 442.601, "r_x1": 417.193, "r_y1": 442.601, "r_x2": 417.193, "r_y2": 431.312, "r_x3": 396.206, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 440.767, "t": 431.312, "r": 457.147, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 442.601, "r_x1": 457.147, "r_y1": 442.601, "r_x2": 457.147, "r_y2": 431.312, "r_x3": 440.767, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 161.906, "t": 450.142, "r": 166.513, "b": 461.431, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 461.431, "r_x1": 166.513, "r_y1": 461.431, "r_x2": 166.513, "r_y2": 450.142, "r_x3": 161.906, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 209.509, "t": 450.142, "r": 214.116, "b": 461.431, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 461.431, "r_x1": 214.116, "r_y1": 461.431, "r_x2": 214.116, "r_y2": 450.142, "r_x3": 209.509, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 246.71, "t": 444.662, "r": 271.405, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.951, "r_x1": 271.405, "r_y1": 455.951, "r_x2": 271.405, "r_y2": 444.662, "r_x3": 246.71, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 289.017, "t": 444.662, "r": 310.004, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.951, "r_x1": 310.004, "r_y1": 455.951, "r_x2": 310.004, "r_y2": 444.662, "r_x3": 289.017, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 329.021, "t": 444.662, "r": 345.401, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.951, "r_x1": 345.401, "r_y1": 455.951, "r_x2": 345.401, "r_y2": 444.662, "r_x3": 329.021, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 362.088, "t": 446.877, "r": 386.249, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 454.803, "r_x1": 386.249, "r_y1": 454.803, "r_x2": 386.249, "r_y2": 446.877, "r_x3": 362.088, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 394.618, "t": 446.877, "r": 418.779, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 454.803, "r_x1": 418.779, "r_y1": 454.803, "r_x2": 418.779, "r_y2": 446.877, "r_x3": 394.618, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 439.527, "t": 446.877, "r": 458.384, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 454.803, "r_x1": 458.384, "r_y1": 454.803, "r_x2": 458.384, "r_y2": 446.877, "r_x3": 439.527, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 245.176, "t": 457.614, "r": 272.94, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.903, "r_x1": 272.94, "r_y1": 468.903, "r_x2": 272.94, "r_y2": 457.614, "r_x3": 245.176, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 289.017, "t": 457.614, "r": 310.004, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.903, "r_x1": 310.004, "r_y1": 468.903, "r_x2": 310.004, "r_y2": 457.614, "r_x3": 289.017, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 326.717, "t": 457.614, "r": 347.704, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.903, "r_x1": 347.704, "r_y1": 468.903, "r_x2": 347.704, "r_y2": 457.614, "r_x3": 326.717, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 363.676, "t": 457.614, "r": 384.663, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.903, "r_x1": 384.663, "r_y1": 468.903, "r_x2": 384.663, "r_y2": 457.614, "r_x3": 363.676, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 396.206, "t": 457.614, "r": 417.193, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.903, "r_x1": 417.193, "r_y1": 468.903, "r_x2": 417.193, "r_y2": 457.614, "r_x3": 396.206, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 446.653, "t": 457.614, "r": 451.26, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.903, "r_x1": 451.26, "r_y1": 468.903, "r_x2": 451.26, "r_y2": 457.614, "r_x3": 446.653, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 5, "label": "section_header", "bbox": {"l": 134.765, "t": 508.152, "r": 264.403, "b": 516.9590000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9592539668083191, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 516.9590000000001, "r_x1": 149.402, "r_y1": 516.9590000000001, "r_x2": 149.402, "r_y2": 508.152, "r_x3": 134.765, "r_y3": 508.152, "coord_origin": "TOPLEFT"}, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 516.9590000000001, "r_x1": 264.403, "r_y1": 516.9590000000001, "r_x2": 264.403, "r_y2": 508.152, "r_x3": 160.859, "r_y3": 508.152, "coord_origin": "TOPLEFT"}, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 524.5509999999999, "r": 480.596, "b": 617.035, "coord_origin": "TOPLEFT"}, "confidence": 0.9854757189750671, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.348, "r_x1": 480.591, "r_y1": 533.348, "r_x2": 480.591, "r_y2": 524.5509999999999, "r_x3": 134.765, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 164.921, "r_y1": 545.304, "r_x2": 164.921, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "quality", "orig": "quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.324, "r_y0": 545.304, "r_x1": 480.587, "r_y1": 545.304, "r_x2": 480.587, "r_y2": 536.5070000000001, "r_x3": 169.324, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.596, "r_y1": 557.259, "r_x2": 480.596, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 480.592, "r_y1": 569.2139999999999, "r_x2": 480.592, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 480.591, "r_y1": 581.169, "r_x2": 480.591, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.596, "r_y1": 593.124, "r_x2": 480.596, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.588, "r_y1": 605.08, "r_x2": 480.588, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 206.787, "r_y1": 617.035, "r_x2": 206.787, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 620.193, "r": 480.596, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9851234555244446, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 628.99, "r_x1": 205.597, "r_y1": 628.99, "r_x2": 205.597, "r_y2": 620.193, "r_x3": 149.709, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.578, "r_y0": 628.99, "r_x1": 224.412, "r_y1": 628.99, "r_x2": 224.412, "r_y2": 620.193, "r_x3": 210.578, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.383, "r_y0": 628.99, "r_x1": 257.74, "r_y1": 628.99, "r_x2": 257.74, "r_y2": 620.193, "r_x3": 229.383, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "results", "orig": "results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.722, "r_y0": 628.99, "r_x1": 307.319, "r_y1": 628.99, "r_x2": 307.319, "r_y2": 620.193, "r_x3": 262.722, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "show that", "orig": "show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.301, "r_y0": 628.99, "r_x1": 480.593, "r_y1": 628.99, "r_x2": 480.593, "r_y2": 620.193, "r_x3": 312.301, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "OTSL has an advantage over HTML", "orig": "OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.596, "r_y1": 640.9449999999999, "r_x2": 480.596, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.593, "r_y1": 652.9, "r_x2": 480.593, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 405.797, "r_y1": 664.855, "r_x2": 405.797, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {"0": {"label": "table", "id": 0, "page_no": 8, "cluster": {"id": 0, "label": "table", "bbox": {"l": 139.66845703125, "t": 337.5747985839844, "r": 475.00372314453125, "b": 469.4721374511719, "coord_origin": "TOPLEFT"}, "confidence": 0.9901032447814941, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.746, "r_x1": 168.048, "r_y1": 350.746, "r_x2": 168.048, "r_y2": 339.457, "r_x3": 160.37, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 363.697, "r_x1": 183.828, "r_y1": 363.697, "r_x2": 183.828, "r_y2": 352.408, "r_x3": 144.592, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.746, "r_x1": 215.652, "r_y1": 350.746, "r_x2": 215.652, "r_y2": 339.457, "r_x3": 207.974, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 363.697, "r_x1": 231.431, "r_y1": 363.697, "r_x2": 231.431, "r_y2": 352.408, "r_x3": 192.195, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 356.225, "r_x1": 278.318, "r_y1": 356.225, "r_x2": 278.318, "r_y2": 344.936, "r_x3": 239.798, "r_y3": 344.936, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.746, "r_x1": 348.264, "r_y1": 350.746, "r_x2": 348.264, "r_y2": 339.457, "r_x3": 324.67, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.746, "r_x1": 417.127, "r_y1": 350.746, "r_x2": 417.127, "r_y2": 339.457, "r_x3": 396.271, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 361.705, "r_x1": 418.473, "r_y1": 361.705, "r_x2": 418.473, "r_y2": 350.416, "r_x3": 394.927, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.746, "r_x1": 467.142, "r_y1": 350.746, "r_x2": 467.142, "r_y2": 339.457, "r_x3": 430.771, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 361.705, "r_x1": 470.761, "r_y1": 361.705, "r_x2": 470.761, "r_y2": 350.416, "r_x3": 427.148, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 363.697, "r_x1": 312.333, "r_y1": 363.697, "r_x2": 312.333, "r_y2": 352.408, "r_x3": 286.686, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 363.697, "r_x1": 353.72, "r_y1": 363.697, "r_x2": 353.72, "r_y2": 352.408, "r_x3": 320.702, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 363.697, "r_x1": 379.031, "r_y1": 363.697, "r_x2": 379.031, "r_y2": 352.408, "r_x3": 369.306, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 382.527, "r_x1": 166.513, "r_y1": 382.527, "r_x2": 166.513, "r_y2": 371.238, "r_x3": 161.906, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 382.527, "r_x1": 214.116, "r_y1": 382.527, "r_x2": 214.116, "r_y2": 371.238, "r_x3": 209.509, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 377.047, "r_x1": 271.405, "r_y1": 377.047, "r_x2": 271.405, "r_y2": 365.758, "r_x3": 246.71, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 377.047, "r_x1": 310.004, "r_y1": 377.047, "r_x2": 310.004, "r_y2": 365.758, "r_x3": 289.017, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 377.047, "r_x1": 347.704, "r_y1": 377.047, "r_x2": 347.704, "r_y2": 365.758, "r_x3": 326.717, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 377.047, "r_x1": 384.663, "r_y1": 377.047, "r_x2": 384.663, "r_y2": 365.758, "r_x3": 363.676, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 375.899, "r_x1": 416.127, "r_y1": 375.899, "r_x2": 416.127, "r_y2": 367.973, "r_x3": 397.27, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 375.899, "r_x1": 458.384, "r_y1": 375.899, "r_x2": 458.384, "r_y2": 367.973, "r_x3": 439.527, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.999, "r_x1": 272.94, "r_y1": 389.999, "r_x2": 272.94, "r_y2": 378.71, "r_x3": 245.176, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.999, "r_x1": 310.004, "r_y1": 389.999, "r_x2": 310.004, "r_y2": 378.71, "r_x3": 289.017, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.999, "r_x1": 347.704, "r_y1": 389.999, "r_x2": 347.704, "r_y2": 378.71, "r_x3": 326.717, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.999, "r_x1": 384.663, "r_y1": 389.999, "r_x2": 384.663, "r_y2": 378.71, "r_x3": 363.676, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.999, "r_x1": 417.193, "r_y1": 389.999, "r_x2": 417.193, "r_y2": 378.71, "r_x3": 396.206, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.999, "r_x1": 457.147, "r_y1": 389.999, "r_x2": 457.147, "r_y2": 378.71, "r_x3": 440.767, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.828, "r_x1": 166.513, "r_y1": 408.828, "r_x2": 166.513, "r_y2": 397.539, "r_x3": 161.906, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.828, "r_x1": 214.116, "r_y1": 408.828, "r_x2": 214.116, "r_y2": 397.539, "r_x3": 209.509, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 403.349, "r_x1": 271.405, "r_y1": 403.349, "r_x2": 271.405, "r_y2": 392.06, "r_x3": 246.71, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 403.349, "r_x1": 310.004, "r_y1": 403.349, "r_x2": 310.004, "r_y2": 392.06, "r_x3": 289.017, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 403.349, "r_x1": 347.704, "r_y1": 403.349, "r_x2": 347.704, "r_y2": 392.06, "r_x3": 326.717, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 403.349, "r_x1": 384.663, "r_y1": 403.349, "r_x2": 384.663, "r_y2": 392.06, "r_x3": 363.676, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 402.201, "r_x1": 418.779, "r_y1": 402.201, "r_x2": 418.779, "r_y2": 394.275, "r_x3": 394.618, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 402.201, "r_x1": 458.384, "r_y1": 402.201, "r_x2": 458.384, "r_y2": 394.275, "r_x3": 439.527, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 416.3, "r_x1": 272.94, "r_y1": 416.3, "r_x2": 272.94, "r_y2": 405.011, "r_x3": 245.176, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 416.3, "r_x1": 310.004, "r_y1": 416.3, "r_x2": 310.004, "r_y2": 405.011, "r_x3": 289.017, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 416.3, "r_x1": 347.704, "r_y1": 416.3, "r_x2": 347.704, "r_y2": 405.011, "r_x3": 326.717, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 415.152, "r_x1": 386.249, "r_y1": 415.152, "r_x2": 386.249, "r_y2": 407.226, "r_x3": 362.088, "r_y3": 407.226, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 416.3, "r_x1": 417.193, "r_y1": 416.3, "r_x2": 417.193, "r_y2": 405.011, "r_x3": 396.206, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 416.3, "r_x1": 457.147, "r_y1": 416.3, "r_x2": 457.147, "r_y2": 405.011, "r_x3": 440.767, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 435.129, "r_x1": 166.513, "r_y1": 435.129, "r_x2": 166.513, "r_y2": 423.84, "r_x3": 161.906, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 435.129, "r_x1": 214.116, "r_y1": 435.129, "r_x2": 214.116, "r_y2": 423.84, "r_x3": 209.509, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 429.65, "r_x1": 271.405, "r_y1": 429.65, "r_x2": 271.405, "r_y2": 418.361, "r_x3": 246.71, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 429.65, "r_x1": 310.004, "r_y1": 429.65, "r_x2": 310.004, "r_y2": 418.361, "r_x3": 289.017, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 429.65, "r_x1": 347.704, "r_y1": 429.65, "r_x2": 347.704, "r_y2": 418.361, "r_x3": 326.717, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 429.65, "r_x1": 384.663, "r_y1": 429.65, "r_x2": 384.663, "r_y2": 418.361, "r_x3": 363.676, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 428.502, "r_x1": 418.779, "r_y1": 428.502, "r_x2": 418.779, "r_y2": 420.576, "r_x3": 394.618, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 428.502, "r_x1": 458.384, "r_y1": 428.502, "r_x2": 458.384, "r_y2": 420.576, "r_x3": 439.527, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 442.601, "r_x1": 272.94, "r_y1": 442.601, "r_x2": 272.94, "r_y2": 431.312, "r_x3": 245.176, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 442.601, "r_x1": 310.004, "r_y1": 442.601, "r_x2": 310.004, "r_y2": 431.312, "r_x3": 289.017, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 442.601, "r_x1": 347.704, "r_y1": 442.601, "r_x2": 347.704, "r_y2": 431.312, "r_x3": 326.717, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 441.453, "r_x1": 386.249, "r_y1": 441.453, "r_x2": 386.249, "r_y2": 433.527, "r_x3": 362.088, "r_y3": 433.527, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 442.601, "r_x1": 417.193, "r_y1": 442.601, "r_x2": 417.193, "r_y2": 431.312, "r_x3": 396.206, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 442.601, "r_x1": 457.147, "r_y1": 442.601, "r_x2": 457.147, "r_y2": 431.312, "r_x3": 440.767, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 461.431, "r_x1": 166.513, "r_y1": 461.431, "r_x2": 166.513, "r_y2": 450.142, "r_x3": 161.906, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 461.431, "r_x1": 214.116, "r_y1": 461.431, "r_x2": 214.116, "r_y2": 450.142, "r_x3": 209.509, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.951, "r_x1": 271.405, "r_y1": 455.951, "r_x2": 271.405, "r_y2": 444.662, "r_x3": 246.71, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.951, "r_x1": 310.004, "r_y1": 455.951, "r_x2": 310.004, "r_y2": 444.662, "r_x3": 289.017, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.951, "r_x1": 345.401, "r_y1": 455.951, "r_x2": 345.401, "r_y2": 444.662, "r_x3": 329.021, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 454.803, "r_x1": 386.249, "r_y1": 454.803, "r_x2": 386.249, "r_y2": 446.877, "r_x3": 362.088, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 454.803, "r_x1": 418.779, "r_y1": 454.803, "r_x2": 418.779, "r_y2": 446.877, "r_x3": 394.618, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 454.803, "r_x1": 458.384, "r_y1": 454.803, "r_x2": 458.384, "r_y2": 446.877, "r_x3": 439.527, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.903, "r_x1": 272.94, "r_y1": 468.903, "r_x2": 272.94, "r_y2": 457.614, "r_x3": 245.176, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.903, "r_x1": 310.004, "r_y1": 468.903, "r_x2": 310.004, "r_y2": 457.614, "r_x3": 289.017, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.903, "r_x1": 347.704, "r_y1": 468.903, "r_x2": 347.704, "r_y2": 457.614, "r_x3": 326.717, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.903, "r_x1": 384.663, "r_y1": 468.903, "r_x2": 384.663, "r_y2": 457.614, "r_x3": 363.676, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.903, "r_x1": 417.193, "r_y1": 468.903, "r_x2": 417.193, "r_y2": 457.614, "r_x3": 396.206, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.903, "r_x1": 451.26, "r_y1": 468.903, "r_x2": 451.26, "r_y2": 457.614, "r_x3": 446.653, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 160.37, "t": 339.457, "r": 168.048, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.746, "r_x1": 168.048, "r_y1": 350.746, "r_x2": 168.048, "r_y2": 339.457, "r_x3": 160.37, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 144.592, "t": 352.408, "r": 183.828, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 363.697, "r_x1": 183.828, "r_y1": 363.697, "r_x2": 183.828, "r_y2": 352.408, "r_x3": 144.592, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 207.974, "t": 339.457, "r": 215.652, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.746, "r_x1": 215.652, "r_y1": 350.746, "r_x2": 215.652, "r_y2": 339.457, "r_x3": 207.974, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 192.195, "t": 352.408, "r": 231.431, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 363.697, "r_x1": 231.431, "r_y1": 363.697, "r_x2": 231.431, "r_y2": 352.408, "r_x3": 192.195, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 239.798, "t": 344.936, "r": 278.318, "b": 356.225, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 356.225, "r_x1": 278.318, "r_y1": 356.225, "r_x2": 278.318, "r_y2": 344.936, "r_x3": 239.798, "r_y3": 344.936, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 324.67, "t": 339.457, "r": 348.264, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.746, "r_x1": 348.264, "r_y1": 350.746, "r_x2": 348.264, "r_y2": 339.457, "r_x3": 324.67, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 396.271, "t": 339.457, "r": 417.127, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.746, "r_x1": 417.127, "r_y1": 350.746, "r_x2": 417.127, "r_y2": 339.457, "r_x3": 396.271, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 394.927, "t": 350.416, "r": 418.473, "b": 361.705, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 361.705, "r_x1": 418.473, "r_y1": 361.705, "r_x2": 418.473, "r_y2": 350.416, "r_x3": 394.927, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 430.771, "t": 339.457, "r": 467.142, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.746, "r_x1": 467.142, "r_y1": 350.746, "r_x2": 467.142, "r_y2": 339.457, "r_x3": 430.771, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 427.148, "t": 350.416, "r": 470.761, "b": 361.705, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 361.705, "r_x1": 470.761, "r_y1": 361.705, "r_x2": 470.761, "r_y2": 350.416, "r_x3": 427.148, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 286.686, "t": 352.408, "r": 312.333, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 363.697, "r_x1": 312.333, "r_y1": 363.697, "r_x2": 312.333, "r_y2": 352.408, "r_x3": 286.686, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 320.702, "t": 352.408, "r": 353.72, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 363.697, "r_x1": 353.72, "r_y1": 363.697, "r_x2": 353.72, "r_y2": 352.408, "r_x3": 320.702, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 369.306, "t": 352.408, "r": 379.031, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 363.697, "r_x1": 379.031, "r_y1": 363.697, "r_x2": 379.031, "r_y2": 352.408, "r_x3": 369.306, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 161.906, "t": 371.238, "r": 166.513, "b": 382.527, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 382.527, "r_x1": 166.513, "r_y1": 382.527, "r_x2": 166.513, "r_y2": 371.238, "r_x3": 161.906, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 209.509, "t": 371.238, "r": 214.116, "b": 382.527, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 382.527, "r_x1": 214.116, "r_y1": 382.527, "r_x2": 214.116, "r_y2": 371.238, "r_x3": 209.509, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 246.71, "t": 365.758, "r": 271.405, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 377.047, "r_x1": 271.405, "r_y1": 377.047, "r_x2": 271.405, "r_y2": 365.758, "r_x3": 246.71, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 289.017, "t": 365.758, "r": 310.004, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 377.047, "r_x1": 310.004, "r_y1": 377.047, "r_x2": 310.004, "r_y2": 365.758, "r_x3": 289.017, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 326.717, "t": 365.758, "r": 347.704, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 377.047, "r_x1": 347.704, "r_y1": 377.047, "r_x2": 347.704, "r_y2": 365.758, "r_x3": 326.717, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 363.676, "t": 365.758, "r": 384.663, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 377.047, "r_x1": 384.663, "r_y1": 377.047, "r_x2": 384.663, "r_y2": 365.758, "r_x3": 363.676, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 397.27, "t": 367.973, "r": 416.127, "b": 375.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 375.899, "r_x1": 416.127, "r_y1": 375.899, "r_x2": 416.127, "r_y2": 367.973, "r_x3": 397.27, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 439.527, "t": 367.973, "r": 458.384, "b": 375.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 375.899, "r_x1": 458.384, "r_y1": 375.899, "r_x2": 458.384, "r_y2": 367.973, "r_x3": 439.527, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 245.176, "t": 378.71, "r": 272.94, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.999, "r_x1": 272.94, "r_y1": 389.999, "r_x2": 272.94, "r_y2": 378.71, "r_x3": 245.176, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 289.017, "t": 378.71, "r": 310.004, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.999, "r_x1": 310.004, "r_y1": 389.999, "r_x2": 310.004, "r_y2": 378.71, "r_x3": 289.017, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 326.717, "t": 378.71, "r": 347.704, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.999, "r_x1": 347.704, "r_y1": 389.999, "r_x2": 347.704, "r_y2": 378.71, "r_x3": 326.717, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 363.676, "t": 378.71, "r": 384.663, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.999, "r_x1": 384.663, "r_y1": 389.999, "r_x2": 384.663, "r_y2": 378.71, "r_x3": 363.676, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 396.206, "t": 378.71, "r": 417.193, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.999, "r_x1": 417.193, "r_y1": 389.999, "r_x2": 417.193, "r_y2": 378.71, "r_x3": 396.206, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 440.767, "t": 378.71, "r": 457.147, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.999, "r_x1": 457.147, "r_y1": 389.999, "r_x2": 457.147, "r_y2": 378.71, "r_x3": 440.767, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 161.906, "t": 397.539, "r": 166.513, "b": 408.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.828, "r_x1": 166.513, "r_y1": 408.828, "r_x2": 166.513, "r_y2": 397.539, "r_x3": 161.906, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 209.509, "t": 397.539, "r": 214.116, "b": 408.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.828, "r_x1": 214.116, "r_y1": 408.828, "r_x2": 214.116, "r_y2": 397.539, "r_x3": 209.509, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 246.71, "t": 392.06, "r": 271.405, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 403.349, "r_x1": 271.405, "r_y1": 403.349, "r_x2": 271.405, "r_y2": 392.06, "r_x3": 246.71, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 289.017, "t": 392.06, "r": 310.004, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 403.349, "r_x1": 310.004, "r_y1": 403.349, "r_x2": 310.004, "r_y2": 392.06, "r_x3": 289.017, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 326.717, "t": 392.06, "r": 347.704, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 403.349, "r_x1": 347.704, "r_y1": 403.349, "r_x2": 347.704, "r_y2": 392.06, "r_x3": 326.717, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 363.676, "t": 392.06, "r": 384.663, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 403.349, "r_x1": 384.663, "r_y1": 403.349, "r_x2": 384.663, "r_y2": 392.06, "r_x3": 363.676, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 394.618, "t": 394.275, "r": 418.779, "b": 402.201, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 402.201, "r_x1": 418.779, "r_y1": 402.201, "r_x2": 418.779, "r_y2": 394.275, "r_x3": 394.618, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 439.527, "t": 394.275, "r": 458.384, "b": 402.201, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 402.201, "r_x1": 458.384, "r_y1": 402.201, "r_x2": 458.384, "r_y2": 394.275, "r_x3": 439.527, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 245.176, "t": 405.011, "r": 272.94, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 416.3, "r_x1": 272.94, "r_y1": 416.3, "r_x2": 272.94, "r_y2": 405.011, "r_x3": 245.176, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 289.017, "t": 405.011, "r": 310.004, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 416.3, "r_x1": 310.004, "r_y1": 416.3, "r_x2": 310.004, "r_y2": 405.011, "r_x3": 289.017, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 326.717, "t": 405.011, "r": 347.704, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 416.3, "r_x1": 347.704, "r_y1": 416.3, "r_x2": 347.704, "r_y2": 405.011, "r_x3": 326.717, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 362.088, "t": 407.226, "r": 386.249, "b": 415.152, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 415.152, "r_x1": 386.249, "r_y1": 415.152, "r_x2": 386.249, "r_y2": 407.226, "r_x3": 362.088, "r_y3": 407.226, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 396.206, "t": 405.011, "r": 417.193, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 416.3, "r_x1": 417.193, "r_y1": 416.3, "r_x2": 417.193, "r_y2": 405.011, "r_x3": 396.206, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 440.767, "t": 405.011, "r": 457.147, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 416.3, "r_x1": 457.147, "r_y1": 416.3, "r_x2": 457.147, "r_y2": 405.011, "r_x3": 440.767, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 161.906, "t": 423.84, "r": 166.513, "b": 435.129, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 435.129, "r_x1": 166.513, "r_y1": 435.129, "r_x2": 166.513, "r_y2": 423.84, "r_x3": 161.906, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 209.509, "t": 423.84, "r": 214.116, "b": 435.129, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 435.129, "r_x1": 214.116, "r_y1": 435.129, "r_x2": 214.116, "r_y2": 423.84, "r_x3": 209.509, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 246.71, "t": 418.361, "r": 271.405, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 429.65, "r_x1": 271.405, "r_y1": 429.65, "r_x2": 271.405, "r_y2": 418.361, "r_x3": 246.71, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 289.017, "t": 418.361, "r": 310.004, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 429.65, "r_x1": 310.004, "r_y1": 429.65, "r_x2": 310.004, "r_y2": 418.361, "r_x3": 289.017, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 326.717, "t": 418.361, "r": 347.704, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 429.65, "r_x1": 347.704, "r_y1": 429.65, "r_x2": 347.704, "r_y2": 418.361, "r_x3": 326.717, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 363.676, "t": 418.361, "r": 384.663, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 429.65, "r_x1": 384.663, "r_y1": 429.65, "r_x2": 384.663, "r_y2": 418.361, "r_x3": 363.676, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 394.618, "t": 420.576, "r": 418.779, "b": 428.502, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 428.502, "r_x1": 418.779, "r_y1": 428.502, "r_x2": 418.779, "r_y2": 420.576, "r_x3": 394.618, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 439.527, "t": 420.576, "r": 458.384, "b": 428.502, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 428.502, "r_x1": 458.384, "r_y1": 428.502, "r_x2": 458.384, "r_y2": 420.576, "r_x3": 439.527, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 245.176, "t": 431.312, "r": 272.94, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 442.601, "r_x1": 272.94, "r_y1": 442.601, "r_x2": 272.94, "r_y2": 431.312, "r_x3": 245.176, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 289.017, "t": 431.312, "r": 310.004, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 442.601, "r_x1": 310.004, "r_y1": 442.601, "r_x2": 310.004, "r_y2": 431.312, "r_x3": 289.017, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 326.717, "t": 431.312, "r": 347.704, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 442.601, "r_x1": 347.704, "r_y1": 442.601, "r_x2": 347.704, "r_y2": 431.312, "r_x3": 326.717, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 362.088, "t": 433.527, "r": 386.249, "b": 441.453, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 441.453, "r_x1": 386.249, "r_y1": 441.453, "r_x2": 386.249, "r_y2": 433.527, "r_x3": 362.088, "r_y3": 433.527, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 396.206, "t": 431.312, "r": 417.193, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 442.601, "r_x1": 417.193, "r_y1": 442.601, "r_x2": 417.193, "r_y2": 431.312, "r_x3": 396.206, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 440.767, "t": 431.312, "r": 457.147, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 442.601, "r_x1": 457.147, "r_y1": 442.601, "r_x2": 457.147, "r_y2": 431.312, "r_x3": 440.767, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 161.906, "t": 450.142, "r": 166.513, "b": 461.431, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 461.431, "r_x1": 166.513, "r_y1": 461.431, "r_x2": 166.513, "r_y2": 450.142, "r_x3": 161.906, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 209.509, "t": 450.142, "r": 214.116, "b": 461.431, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 461.431, "r_x1": 214.116, "r_y1": 461.431, "r_x2": 214.116, "r_y2": 450.142, "r_x3": 209.509, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 246.71, "t": 444.662, "r": 271.405, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.951, "r_x1": 271.405, "r_y1": 455.951, "r_x2": 271.405, "r_y2": 444.662, "r_x3": 246.71, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 289.017, "t": 444.662, "r": 310.004, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.951, "r_x1": 310.004, "r_y1": 455.951, "r_x2": 310.004, "r_y2": 444.662, "r_x3": 289.017, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 329.021, "t": 444.662, "r": 345.401, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.951, "r_x1": 345.401, "r_y1": 455.951, "r_x2": 345.401, "r_y2": 444.662, "r_x3": 329.021, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 362.088, "t": 446.877, "r": 386.249, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 454.803, "r_x1": 386.249, "r_y1": 454.803, "r_x2": 386.249, "r_y2": 446.877, "r_x3": 362.088, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 394.618, "t": 446.877, "r": 418.779, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 454.803, "r_x1": 418.779, "r_y1": 454.803, "r_x2": 418.779, "r_y2": 446.877, "r_x3": 394.618, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 439.527, "t": 446.877, "r": 458.384, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 454.803, "r_x1": 458.384, "r_y1": 454.803, "r_x2": 458.384, "r_y2": 446.877, "r_x3": 439.527, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 245.176, "t": 457.614, "r": 272.94, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.903, "r_x1": 272.94, "r_y1": 468.903, "r_x2": 272.94, "r_y2": 457.614, "r_x3": 245.176, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 289.017, "t": 457.614, "r": 310.004, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.903, "r_x1": 310.004, "r_y1": 468.903, "r_x2": 310.004, "r_y2": 457.614, "r_x3": 289.017, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 326.717, "t": 457.614, "r": 347.704, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.903, "r_x1": 347.704, "r_y1": 468.903, "r_x2": 347.704, "r_y2": 457.614, "r_x3": 326.717, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 363.676, "t": 457.614, "r": 384.663, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.903, "r_x1": 384.663, "r_y1": 468.903, "r_x2": 384.663, "r_y2": 457.614, "r_x3": 363.676, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 396.206, "t": 457.614, "r": 417.193, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.903, "r_x1": 417.193, "r_y1": 468.903, "r_x2": 417.193, "r_y2": 457.614, "r_x3": 396.206, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 446.653, "t": 457.614, "r": 451.26, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.903, "r_x1": 451.26, "r_y1": 468.903, "r_x2": 451.26, "r_y2": 457.614, "r_x3": 446.653, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 6, "num_cols": 8, "table_cells": [{"bbox": {"l": 144.592, "t": 339.457, "r": 183.828, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 192.195, "t": 339.457, "r": 231.431, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 239.798, "t": 344.936, "r": 278.318, "b": 356.225, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 324.67, "t": 339.457, "r": 348.264, "b": 350.746, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 396.271, "t": 339.457, "r": 417.127, "b": 350.746, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 394.927, "t": 350.416, "r": 418.473, "b": 361.705, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 430.771, "t": 339.457, "r": 467.142, "b": 350.746, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 427.148, "t": 350.416, "r": 470.761, "b": 361.705, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 286.686, "t": 352.408, "r": 312.333, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 320.702, "t": 352.408, "r": 353.72, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 369.306, "t": 352.408, "r": 379.031, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 371.238, "r": 166.513, "b": 382.527, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 371.238, "r": 214.116, "b": 382.527, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 365.758, "r": 272.94, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 365.758, "r": 310.004, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 365.758, "r": 347.704, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 363.676, "t": 365.758, "r": 384.663, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 396.206, "t": 367.973, "r": 417.193, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 367.973, "r": 458.384, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 397.539, "r": 166.513, "b": 408.828, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 397.539, "r": 214.116, "b": 408.828, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 392.06, "r": 272.94, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 392.06, "r": 310.004, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 392.06, "r": 347.704, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 362.088, "t": 392.06, "r": 386.249, "b": 415.152, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.618, "t": 394.275, "r": 418.779, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 394.275, "r": 458.384, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 423.84, "r": 166.513, "b": 435.129, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 423.84, "r": 214.116, "b": 435.129, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 418.361, "r": 272.94, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 418.361, "r": 310.004, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 418.361, "r": 347.704, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 362.088, "t": 418.361, "r": 386.249, "b": 441.453, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.618, "t": 420.576, "r": 418.779, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 420.576, "r": 458.384, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 450.142, "r": 166.513, "b": 461.431, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 450.142, "r": 214.116, "b": 461.431, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 444.662, "r": 272.94, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 444.662, "r": 310.004, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 444.662, "r": 347.704, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 362.088, "t": 446.877, "r": 386.249, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.618, "t": 446.877, "r": 418.779, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 446.877, "r": 458.384, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false}]}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 8, "page_no": 8, "cluster": {"id": 8, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9373378753662109, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 9, "page_no": 8, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8857625722885132, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9"}, {"label": "text", "id": 4, "page_no": 8, "cluster": {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.596, "b": 151.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9805440306663513, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.594, "r_y1": 127.731, "r_x2": 480.594, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.596, "r_y1": 139.68600000000004, "r_x2": 480.596, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 210.785, "r_y1": 151.64200000000005, "r_x2": 210.785, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz."}, {"label": "section_header", "id": 6, "page_no": 8, "cluster": {"id": 6, "label": "section_header", "bbox": {"l": 134.765, "t": 169.18600000000004, "r": 318.448, "b": 177.99300000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9579681158065796, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 177.99300000000005, "r_x1": 149.402, "r_y1": 177.99300000000005, "r_x2": 149.402, "r_y2": 169.18600000000004, "r_x3": 134.765, "r_y3": 169.18600000000004, "coord_origin": "TOPLEFT"}, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 177.99300000000005, "r_x1": 318.448, "r_y1": 177.99300000000005, "r_x2": 318.448, "r_y2": 169.18600000000004, "r_x3": 160.859, "r_y3": 169.18600000000004, "coord_origin": "TOPLEFT"}, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.1 Hyper Parameter Optimization"}, {"label": "text", "id": 3, "page_no": 8, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 185.586, "r": 480.593, "b": 254.159, "coord_origin": "TOPLEFT"}, "confidence": 0.9842326641082764, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 194.38300000000004, "r_x1": 480.592, "r_y1": 194.38300000000004, "r_x2": 480.592, "r_y2": 185.586, "r_x3": 134.765, "r_y3": 185.586, "coord_origin": "TOPLEFT"}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 206.33799999999997, "r_x1": 480.592, "r_y1": 206.33799999999997, "r_x2": 480.592, "r_y2": 197.54100000000005, "r_x3": 134.765, "r_y3": 197.54100000000005, "coord_origin": "TOPLEFT"}, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 218.293, "r_x1": 480.592, "r_y1": 218.293, "r_x2": 480.592, "r_y2": 209.49599999999998, "r_x3": 134.765, "r_y3": 209.49599999999998, "coord_origin": "TOPLEFT"}, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 230.24800000000005, "r_x1": 480.593, "r_y1": 230.24800000000005, "r_x2": 480.593, "r_y2": 221.45100000000002, "r_x3": 134.765, "r_y3": 221.45100000000002, "coord_origin": "TOPLEFT"}, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 242.20299999999997, "r_x1": 440.942, "r_y1": 242.20299999999997, "r_x2": 440.942, "r_y2": 233.40599999999995, "r_x3": 134.765, "r_y3": 233.40599999999995, "coord_origin": "TOPLEFT"}, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.868, "r_y0": 242.20299999999997, "r_x1": 480.588, "r_y1": 242.20299999999997, "r_x2": 480.588, "r_y2": 233.40599999999995, "r_x3": 444.868, "r_y3": 233.40599999999995, "coord_origin": "TOPLEFT"}, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 254.159, "r_x1": 145.201, "r_y1": 254.159, "r_x2": 145.201, "r_y2": 245.36199999999997, "r_x3": 134.765, "r_y3": 245.36199999999997, "coord_origin": "TOPLEFT"}, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.149, "r_y0": 254.159, "r_x1": 311.22, "r_y1": 254.159, "r_x2": 311.22, "r_y2": 245.36199999999997, "r_x3": 149.149, "r_y3": 245.36199999999997, "coord_origin": "TOPLEFT"}, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML."}, {"label": "caption", "id": 7, "page_no": 8, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 134.765, "t": 272.85699999999997, "r": 480.595, "b": 327.982, "coord_origin": "TOPLEFT"}, "confidence": 0.9570781588554382, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 282.998, "r_x1": 160.118, "r_y1": 282.998, "r_x2": 160.118, "r_y2": 275.072, "r_x3": 134.765, "r_y3": 275.072, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.345, "r_y0": 282.998, "r_x1": 175.595, "r_y1": 282.998, "r_x2": 175.595, "r_y2": 275.072, "r_x3": 167.345, "r_y3": 275.072, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.133, "r_y0": 284.146, "r_x1": 255.736, "r_y1": 284.146, "r_x2": 255.736, "r_y2": 272.85699999999997, "r_x3": 188.133, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "HPO performed", "orig": "HPO performed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.013, "r_y0": 284.146, "r_x1": 269.69, "r_y1": 284.146, "r_x2": 269.69, "r_y2": 272.85699999999997, "r_x3": 262.013, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.957, "r_y0": 284.146, "r_x1": 300.652, "r_y1": 284.146, "r_x2": 300.652, "r_y2": 272.85699999999997, "r_x3": 275.957, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.92, "r_y0": 284.146, "r_x1": 321.763, "r_y1": 284.146, "r_x2": 321.763, "r_y2": 272.85699999999997, "r_x3": 306.92, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.03, "r_y0": 284.146, "r_x1": 419.24, "r_y1": 284.146, "r_x2": 419.24, "r_y2": 272.85699999999997, "r_x3": 328.03, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "HTML representation", "orig": "HTML representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.508, "r_y0": 284.146, "r_x1": 435.233, "r_y1": 284.146, "r_x2": 435.233, "r_y2": 272.85699999999997, "r_x3": 425.508, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.509, "r_y0": 284.146, "r_x1": 454.309, "r_y1": 284.146, "r_x2": 454.309, "r_y2": 272.85699999999997, "r_x3": 441.509, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.576, "r_y0": 284.146, "r_x1": 480.594, "r_y1": 284.146, "r_x2": 480.594, "r_y2": 272.85699999999997, "r_x3": 460.576, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "same", "orig": "same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.105, "r_x1": 480.595, "r_y1": 295.105, "r_x2": 480.595, "r_y2": 283.816, "r_x3": 134.765, "r_y3": 283.816, "coord_origin": "TOPLEFT"}, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 306.064, "r_x1": 480.595, "r_y1": 306.064, "r_x2": 480.595, "r_y2": 294.775, "r_x3": 134.765, "r_y3": 294.775, "coord_origin": "TOPLEFT"}, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 317.023, "r_x1": 163.504, "r_y1": 317.023, "r_x2": 163.504, "r_y2": 305.734, "r_x3": 134.765, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "smaller", "orig": "smaller", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.817, "r_y0": 317.023, "r_x1": 443.264, "r_y1": 317.023, "r_x2": 443.264, "r_y2": 305.734, "r_x3": 167.817, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "models trained on OTSL perform better, especially in recognizing", "orig": "models trained on OTSL perform better, especially in recognizing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.577, "r_y0": 317.023, "r_x1": 480.595, "r_y1": 317.023, "r_x2": 480.595, "r_y2": 305.734, "r_x3": 447.577, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 327.982, "r_x1": 480.595, "r_y1": 327.982, "r_x2": 480.595, "r_y2": 316.693, "r_x3": 134.765, "r_y3": 316.693, "coord_origin": "TOPLEFT"}, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart."}, {"label": "table", "id": 0, "page_no": 8, "cluster": {"id": 0, "label": "table", "bbox": {"l": 139.66845703125, "t": 337.5747985839844, "r": 475.00372314453125, "b": 469.4721374511719, "coord_origin": "TOPLEFT"}, "confidence": 0.9901032447814941, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.746, "r_x1": 168.048, "r_y1": 350.746, "r_x2": 168.048, "r_y2": 339.457, "r_x3": 160.37, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 363.697, "r_x1": 183.828, "r_y1": 363.697, "r_x2": 183.828, "r_y2": 352.408, "r_x3": 144.592, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.746, "r_x1": 215.652, "r_y1": 350.746, "r_x2": 215.652, "r_y2": 339.457, "r_x3": 207.974, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 363.697, "r_x1": 231.431, "r_y1": 363.697, "r_x2": 231.431, "r_y2": 352.408, "r_x3": 192.195, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 356.225, "r_x1": 278.318, "r_y1": 356.225, "r_x2": 278.318, "r_y2": 344.936, "r_x3": 239.798, "r_y3": 344.936, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.746, "r_x1": 348.264, "r_y1": 350.746, "r_x2": 348.264, "r_y2": 339.457, "r_x3": 324.67, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.746, "r_x1": 417.127, "r_y1": 350.746, "r_x2": 417.127, "r_y2": 339.457, "r_x3": 396.271, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 361.705, "r_x1": 418.473, "r_y1": 361.705, "r_x2": 418.473, "r_y2": 350.416, "r_x3": 394.927, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.746, "r_x1": 467.142, "r_y1": 350.746, "r_x2": 467.142, "r_y2": 339.457, "r_x3": 430.771, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 361.705, "r_x1": 470.761, "r_y1": 361.705, "r_x2": 470.761, "r_y2": 350.416, "r_x3": 427.148, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 363.697, "r_x1": 312.333, "r_y1": 363.697, "r_x2": 312.333, "r_y2": 352.408, "r_x3": 286.686, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 363.697, "r_x1": 353.72, "r_y1": 363.697, "r_x2": 353.72, "r_y2": 352.408, "r_x3": 320.702, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 363.697, "r_x1": 379.031, "r_y1": 363.697, "r_x2": 379.031, "r_y2": 352.408, "r_x3": 369.306, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 382.527, "r_x1": 166.513, "r_y1": 382.527, "r_x2": 166.513, "r_y2": 371.238, "r_x3": 161.906, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 382.527, "r_x1": 214.116, "r_y1": 382.527, "r_x2": 214.116, "r_y2": 371.238, "r_x3": 209.509, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 377.047, "r_x1": 271.405, "r_y1": 377.047, "r_x2": 271.405, "r_y2": 365.758, "r_x3": 246.71, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 377.047, "r_x1": 310.004, "r_y1": 377.047, "r_x2": 310.004, "r_y2": 365.758, "r_x3": 289.017, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 377.047, "r_x1": 347.704, "r_y1": 377.047, "r_x2": 347.704, "r_y2": 365.758, "r_x3": 326.717, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 377.047, "r_x1": 384.663, "r_y1": 377.047, "r_x2": 384.663, "r_y2": 365.758, "r_x3": 363.676, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 375.899, "r_x1": 416.127, "r_y1": 375.899, "r_x2": 416.127, "r_y2": 367.973, "r_x3": 397.27, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 375.899, "r_x1": 458.384, "r_y1": 375.899, "r_x2": 458.384, "r_y2": 367.973, "r_x3": 439.527, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.999, "r_x1": 272.94, "r_y1": 389.999, "r_x2": 272.94, "r_y2": 378.71, "r_x3": 245.176, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.999, "r_x1": 310.004, "r_y1": 389.999, "r_x2": 310.004, "r_y2": 378.71, "r_x3": 289.017, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.999, "r_x1": 347.704, "r_y1": 389.999, "r_x2": 347.704, "r_y2": 378.71, "r_x3": 326.717, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.999, "r_x1": 384.663, "r_y1": 389.999, "r_x2": 384.663, "r_y2": 378.71, "r_x3": 363.676, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.999, "r_x1": 417.193, "r_y1": 389.999, "r_x2": 417.193, "r_y2": 378.71, "r_x3": 396.206, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.999, "r_x1": 457.147, "r_y1": 389.999, "r_x2": 457.147, "r_y2": 378.71, "r_x3": 440.767, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.828, "r_x1": 166.513, "r_y1": 408.828, "r_x2": 166.513, "r_y2": 397.539, "r_x3": 161.906, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.828, "r_x1": 214.116, "r_y1": 408.828, "r_x2": 214.116, "r_y2": 397.539, "r_x3": 209.509, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 403.349, "r_x1": 271.405, "r_y1": 403.349, "r_x2": 271.405, "r_y2": 392.06, "r_x3": 246.71, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 403.349, "r_x1": 310.004, "r_y1": 403.349, "r_x2": 310.004, "r_y2": 392.06, "r_x3": 289.017, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 403.349, "r_x1": 347.704, "r_y1": 403.349, "r_x2": 347.704, "r_y2": 392.06, "r_x3": 326.717, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 403.349, "r_x1": 384.663, "r_y1": 403.349, "r_x2": 384.663, "r_y2": 392.06, "r_x3": 363.676, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 402.201, "r_x1": 418.779, "r_y1": 402.201, "r_x2": 418.779, "r_y2": 394.275, "r_x3": 394.618, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 402.201, "r_x1": 458.384, "r_y1": 402.201, "r_x2": 458.384, "r_y2": 394.275, "r_x3": 439.527, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 416.3, "r_x1": 272.94, "r_y1": 416.3, "r_x2": 272.94, "r_y2": 405.011, "r_x3": 245.176, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 416.3, "r_x1": 310.004, "r_y1": 416.3, "r_x2": 310.004, "r_y2": 405.011, "r_x3": 289.017, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 416.3, "r_x1": 347.704, "r_y1": 416.3, "r_x2": 347.704, "r_y2": 405.011, "r_x3": 326.717, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 415.152, "r_x1": 386.249, "r_y1": 415.152, "r_x2": 386.249, "r_y2": 407.226, "r_x3": 362.088, "r_y3": 407.226, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 416.3, "r_x1": 417.193, "r_y1": 416.3, "r_x2": 417.193, "r_y2": 405.011, "r_x3": 396.206, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 416.3, "r_x1": 457.147, "r_y1": 416.3, "r_x2": 457.147, "r_y2": 405.011, "r_x3": 440.767, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 435.129, "r_x1": 166.513, "r_y1": 435.129, "r_x2": 166.513, "r_y2": 423.84, "r_x3": 161.906, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 435.129, "r_x1": 214.116, "r_y1": 435.129, "r_x2": 214.116, "r_y2": 423.84, "r_x3": 209.509, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 429.65, "r_x1": 271.405, "r_y1": 429.65, "r_x2": 271.405, "r_y2": 418.361, "r_x3": 246.71, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 429.65, "r_x1": 310.004, "r_y1": 429.65, "r_x2": 310.004, "r_y2": 418.361, "r_x3": 289.017, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 429.65, "r_x1": 347.704, "r_y1": 429.65, "r_x2": 347.704, "r_y2": 418.361, "r_x3": 326.717, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 429.65, "r_x1": 384.663, "r_y1": 429.65, "r_x2": 384.663, "r_y2": 418.361, "r_x3": 363.676, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 428.502, "r_x1": 418.779, "r_y1": 428.502, "r_x2": 418.779, "r_y2": 420.576, "r_x3": 394.618, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 428.502, "r_x1": 458.384, "r_y1": 428.502, "r_x2": 458.384, "r_y2": 420.576, "r_x3": 439.527, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 442.601, "r_x1": 272.94, "r_y1": 442.601, "r_x2": 272.94, "r_y2": 431.312, "r_x3": 245.176, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 442.601, "r_x1": 310.004, "r_y1": 442.601, "r_x2": 310.004, "r_y2": 431.312, "r_x3": 289.017, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 442.601, "r_x1": 347.704, "r_y1": 442.601, "r_x2": 347.704, "r_y2": 431.312, "r_x3": 326.717, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 441.453, "r_x1": 386.249, "r_y1": 441.453, "r_x2": 386.249, "r_y2": 433.527, "r_x3": 362.088, "r_y3": 433.527, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 442.601, "r_x1": 417.193, "r_y1": 442.601, "r_x2": 417.193, "r_y2": 431.312, "r_x3": 396.206, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 442.601, "r_x1": 457.147, "r_y1": 442.601, "r_x2": 457.147, "r_y2": 431.312, "r_x3": 440.767, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 461.431, "r_x1": 166.513, "r_y1": 461.431, "r_x2": 166.513, "r_y2": 450.142, "r_x3": 161.906, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 461.431, "r_x1": 214.116, "r_y1": 461.431, "r_x2": 214.116, "r_y2": 450.142, "r_x3": 209.509, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.951, "r_x1": 271.405, "r_y1": 455.951, "r_x2": 271.405, "r_y2": 444.662, "r_x3": 246.71, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.951, "r_x1": 310.004, "r_y1": 455.951, "r_x2": 310.004, "r_y2": 444.662, "r_x3": 289.017, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.951, "r_x1": 345.401, "r_y1": 455.951, "r_x2": 345.401, "r_y2": 444.662, "r_x3": 329.021, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 454.803, "r_x1": 386.249, "r_y1": 454.803, "r_x2": 386.249, "r_y2": 446.877, "r_x3": 362.088, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 454.803, "r_x1": 418.779, "r_y1": 454.803, "r_x2": 418.779, "r_y2": 446.877, "r_x3": 394.618, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 454.803, "r_x1": 458.384, "r_y1": 454.803, "r_x2": 458.384, "r_y2": 446.877, "r_x3": 439.527, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.903, "r_x1": 272.94, "r_y1": 468.903, "r_x2": 272.94, "r_y2": 457.614, "r_x3": 245.176, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.903, "r_x1": 310.004, "r_y1": 468.903, "r_x2": 310.004, "r_y2": 457.614, "r_x3": 289.017, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.903, "r_x1": 347.704, "r_y1": 468.903, "r_x2": 347.704, "r_y2": 457.614, "r_x3": 326.717, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.903, "r_x1": 384.663, "r_y1": 468.903, "r_x2": 384.663, "r_y2": 457.614, "r_x3": 363.676, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.903, "r_x1": 417.193, "r_y1": 468.903, "r_x2": 417.193, "r_y2": 457.614, "r_x3": 396.206, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.903, "r_x1": 451.26, "r_y1": 468.903, "r_x2": 451.26, "r_y2": 457.614, "r_x3": 446.653, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 160.37, "t": 339.457, "r": 168.048, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.746, "r_x1": 168.048, "r_y1": 350.746, "r_x2": 168.048, "r_y2": 339.457, "r_x3": 160.37, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 144.592, "t": 352.408, "r": 183.828, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 363.697, "r_x1": 183.828, "r_y1": 363.697, "r_x2": 183.828, "r_y2": 352.408, "r_x3": 144.592, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 207.974, "t": 339.457, "r": 215.652, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.746, "r_x1": 215.652, "r_y1": 350.746, "r_x2": 215.652, "r_y2": 339.457, "r_x3": 207.974, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 192.195, "t": 352.408, "r": 231.431, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 363.697, "r_x1": 231.431, "r_y1": 363.697, "r_x2": 231.431, "r_y2": 352.408, "r_x3": 192.195, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 239.798, "t": 344.936, "r": 278.318, "b": 356.225, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 356.225, "r_x1": 278.318, "r_y1": 356.225, "r_x2": 278.318, "r_y2": 344.936, "r_x3": 239.798, "r_y3": 344.936, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 324.67, "t": 339.457, "r": 348.264, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.746, "r_x1": 348.264, "r_y1": 350.746, "r_x2": 348.264, "r_y2": 339.457, "r_x3": 324.67, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 396.271, "t": 339.457, "r": 417.127, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.746, "r_x1": 417.127, "r_y1": 350.746, "r_x2": 417.127, "r_y2": 339.457, "r_x3": 396.271, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 394.927, "t": 350.416, "r": 418.473, "b": 361.705, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 361.705, "r_x1": 418.473, "r_y1": 361.705, "r_x2": 418.473, "r_y2": 350.416, "r_x3": 394.927, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 430.771, "t": 339.457, "r": 467.142, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.746, "r_x1": 467.142, "r_y1": 350.746, "r_x2": 467.142, "r_y2": 339.457, "r_x3": 430.771, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 427.148, "t": 350.416, "r": 470.761, "b": 361.705, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 361.705, "r_x1": 470.761, "r_y1": 361.705, "r_x2": 470.761, "r_y2": 350.416, "r_x3": 427.148, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 286.686, "t": 352.408, "r": 312.333, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 363.697, "r_x1": 312.333, "r_y1": 363.697, "r_x2": 312.333, "r_y2": 352.408, "r_x3": 286.686, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 320.702, "t": 352.408, "r": 353.72, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 363.697, "r_x1": 353.72, "r_y1": 363.697, "r_x2": 353.72, "r_y2": 352.408, "r_x3": 320.702, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 369.306, "t": 352.408, "r": 379.031, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 363.697, "r_x1": 379.031, "r_y1": 363.697, "r_x2": 379.031, "r_y2": 352.408, "r_x3": 369.306, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 161.906, "t": 371.238, "r": 166.513, "b": 382.527, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 382.527, "r_x1": 166.513, "r_y1": 382.527, "r_x2": 166.513, "r_y2": 371.238, "r_x3": 161.906, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 209.509, "t": 371.238, "r": 214.116, "b": 382.527, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 382.527, "r_x1": 214.116, "r_y1": 382.527, "r_x2": 214.116, "r_y2": 371.238, "r_x3": 209.509, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 246.71, "t": 365.758, "r": 271.405, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 377.047, "r_x1": 271.405, "r_y1": 377.047, "r_x2": 271.405, "r_y2": 365.758, "r_x3": 246.71, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 289.017, "t": 365.758, "r": 310.004, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 377.047, "r_x1": 310.004, "r_y1": 377.047, "r_x2": 310.004, "r_y2": 365.758, "r_x3": 289.017, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 326.717, "t": 365.758, "r": 347.704, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 377.047, "r_x1": 347.704, "r_y1": 377.047, "r_x2": 347.704, "r_y2": 365.758, "r_x3": 326.717, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 363.676, "t": 365.758, "r": 384.663, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 377.047, "r_x1": 384.663, "r_y1": 377.047, "r_x2": 384.663, "r_y2": 365.758, "r_x3": 363.676, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 397.27, "t": 367.973, "r": 416.127, "b": 375.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 375.899, "r_x1": 416.127, "r_y1": 375.899, "r_x2": 416.127, "r_y2": 367.973, "r_x3": 397.27, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 439.527, "t": 367.973, "r": 458.384, "b": 375.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 375.899, "r_x1": 458.384, "r_y1": 375.899, "r_x2": 458.384, "r_y2": 367.973, "r_x3": 439.527, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 245.176, "t": 378.71, "r": 272.94, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.999, "r_x1": 272.94, "r_y1": 389.999, "r_x2": 272.94, "r_y2": 378.71, "r_x3": 245.176, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 289.017, "t": 378.71, "r": 310.004, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.999, "r_x1": 310.004, "r_y1": 389.999, "r_x2": 310.004, "r_y2": 378.71, "r_x3": 289.017, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 326.717, "t": 378.71, "r": 347.704, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.999, "r_x1": 347.704, "r_y1": 389.999, "r_x2": 347.704, "r_y2": 378.71, "r_x3": 326.717, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 363.676, "t": 378.71, "r": 384.663, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.999, "r_x1": 384.663, "r_y1": 389.999, "r_x2": 384.663, "r_y2": 378.71, "r_x3": 363.676, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 396.206, "t": 378.71, "r": 417.193, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.999, "r_x1": 417.193, "r_y1": 389.999, "r_x2": 417.193, "r_y2": 378.71, "r_x3": 396.206, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 440.767, "t": 378.71, "r": 457.147, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.999, "r_x1": 457.147, "r_y1": 389.999, "r_x2": 457.147, "r_y2": 378.71, "r_x3": 440.767, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 161.906, "t": 397.539, "r": 166.513, "b": 408.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.828, "r_x1": 166.513, "r_y1": 408.828, "r_x2": 166.513, "r_y2": 397.539, "r_x3": 161.906, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 209.509, "t": 397.539, "r": 214.116, "b": 408.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.828, "r_x1": 214.116, "r_y1": 408.828, "r_x2": 214.116, "r_y2": 397.539, "r_x3": 209.509, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 246.71, "t": 392.06, "r": 271.405, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 403.349, "r_x1": 271.405, "r_y1": 403.349, "r_x2": 271.405, "r_y2": 392.06, "r_x3": 246.71, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 289.017, "t": 392.06, "r": 310.004, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 403.349, "r_x1": 310.004, "r_y1": 403.349, "r_x2": 310.004, "r_y2": 392.06, "r_x3": 289.017, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 326.717, "t": 392.06, "r": 347.704, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 403.349, "r_x1": 347.704, "r_y1": 403.349, "r_x2": 347.704, "r_y2": 392.06, "r_x3": 326.717, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 363.676, "t": 392.06, "r": 384.663, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 403.349, "r_x1": 384.663, "r_y1": 403.349, "r_x2": 384.663, "r_y2": 392.06, "r_x3": 363.676, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 394.618, "t": 394.275, "r": 418.779, "b": 402.201, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 402.201, "r_x1": 418.779, "r_y1": 402.201, "r_x2": 418.779, "r_y2": 394.275, "r_x3": 394.618, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 439.527, "t": 394.275, "r": 458.384, "b": 402.201, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 402.201, "r_x1": 458.384, "r_y1": 402.201, "r_x2": 458.384, "r_y2": 394.275, "r_x3": 439.527, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 245.176, "t": 405.011, "r": 272.94, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 416.3, "r_x1": 272.94, "r_y1": 416.3, "r_x2": 272.94, "r_y2": 405.011, "r_x3": 245.176, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 289.017, "t": 405.011, "r": 310.004, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 416.3, "r_x1": 310.004, "r_y1": 416.3, "r_x2": 310.004, "r_y2": 405.011, "r_x3": 289.017, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 326.717, "t": 405.011, "r": 347.704, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 416.3, "r_x1": 347.704, "r_y1": 416.3, "r_x2": 347.704, "r_y2": 405.011, "r_x3": 326.717, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 362.088, "t": 407.226, "r": 386.249, "b": 415.152, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 415.152, "r_x1": 386.249, "r_y1": 415.152, "r_x2": 386.249, "r_y2": 407.226, "r_x3": 362.088, "r_y3": 407.226, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 396.206, "t": 405.011, "r": 417.193, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 416.3, "r_x1": 417.193, "r_y1": 416.3, "r_x2": 417.193, "r_y2": 405.011, "r_x3": 396.206, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 440.767, "t": 405.011, "r": 457.147, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 416.3, "r_x1": 457.147, "r_y1": 416.3, "r_x2": 457.147, "r_y2": 405.011, "r_x3": 440.767, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 161.906, "t": 423.84, "r": 166.513, "b": 435.129, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 435.129, "r_x1": 166.513, "r_y1": 435.129, "r_x2": 166.513, "r_y2": 423.84, "r_x3": 161.906, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 209.509, "t": 423.84, "r": 214.116, "b": 435.129, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 435.129, "r_x1": 214.116, "r_y1": 435.129, "r_x2": 214.116, "r_y2": 423.84, "r_x3": 209.509, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 246.71, "t": 418.361, "r": 271.405, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 429.65, "r_x1": 271.405, "r_y1": 429.65, "r_x2": 271.405, "r_y2": 418.361, "r_x3": 246.71, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 289.017, "t": 418.361, "r": 310.004, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 429.65, "r_x1": 310.004, "r_y1": 429.65, "r_x2": 310.004, "r_y2": 418.361, "r_x3": 289.017, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 326.717, "t": 418.361, "r": 347.704, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 429.65, "r_x1": 347.704, "r_y1": 429.65, "r_x2": 347.704, "r_y2": 418.361, "r_x3": 326.717, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 363.676, "t": 418.361, "r": 384.663, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 429.65, "r_x1": 384.663, "r_y1": 429.65, "r_x2": 384.663, "r_y2": 418.361, "r_x3": 363.676, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 394.618, "t": 420.576, "r": 418.779, "b": 428.502, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 428.502, "r_x1": 418.779, "r_y1": 428.502, "r_x2": 418.779, "r_y2": 420.576, "r_x3": 394.618, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 439.527, "t": 420.576, "r": 458.384, "b": 428.502, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 428.502, "r_x1": 458.384, "r_y1": 428.502, "r_x2": 458.384, "r_y2": 420.576, "r_x3": 439.527, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 245.176, "t": 431.312, "r": 272.94, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 442.601, "r_x1": 272.94, "r_y1": 442.601, "r_x2": 272.94, "r_y2": 431.312, "r_x3": 245.176, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 289.017, "t": 431.312, "r": 310.004, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 442.601, "r_x1": 310.004, "r_y1": 442.601, "r_x2": 310.004, "r_y2": 431.312, "r_x3": 289.017, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 326.717, "t": 431.312, "r": 347.704, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 442.601, "r_x1": 347.704, "r_y1": 442.601, "r_x2": 347.704, "r_y2": 431.312, "r_x3": 326.717, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 362.088, "t": 433.527, "r": 386.249, "b": 441.453, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 441.453, "r_x1": 386.249, "r_y1": 441.453, "r_x2": 386.249, "r_y2": 433.527, "r_x3": 362.088, "r_y3": 433.527, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 396.206, "t": 431.312, "r": 417.193, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 442.601, "r_x1": 417.193, "r_y1": 442.601, "r_x2": 417.193, "r_y2": 431.312, "r_x3": 396.206, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 440.767, "t": 431.312, "r": 457.147, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 442.601, "r_x1": 457.147, "r_y1": 442.601, "r_x2": 457.147, "r_y2": 431.312, "r_x3": 440.767, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 161.906, "t": 450.142, "r": 166.513, "b": 461.431, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 461.431, "r_x1": 166.513, "r_y1": 461.431, "r_x2": 166.513, "r_y2": 450.142, "r_x3": 161.906, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 209.509, "t": 450.142, "r": 214.116, "b": 461.431, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 461.431, "r_x1": 214.116, "r_y1": 461.431, "r_x2": 214.116, "r_y2": 450.142, "r_x3": 209.509, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 246.71, "t": 444.662, "r": 271.405, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.951, "r_x1": 271.405, "r_y1": 455.951, "r_x2": 271.405, "r_y2": 444.662, "r_x3": 246.71, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 289.017, "t": 444.662, "r": 310.004, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.951, "r_x1": 310.004, "r_y1": 455.951, "r_x2": 310.004, "r_y2": 444.662, "r_x3": 289.017, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 329.021, "t": 444.662, "r": 345.401, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.951, "r_x1": 345.401, "r_y1": 455.951, "r_x2": 345.401, "r_y2": 444.662, "r_x3": 329.021, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 362.088, "t": 446.877, "r": 386.249, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 454.803, "r_x1": 386.249, "r_y1": 454.803, "r_x2": 386.249, "r_y2": 446.877, "r_x3": 362.088, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 394.618, "t": 446.877, "r": 418.779, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 454.803, "r_x1": 418.779, "r_y1": 454.803, "r_x2": 418.779, "r_y2": 446.877, "r_x3": 394.618, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 439.527, "t": 446.877, "r": 458.384, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 454.803, "r_x1": 458.384, "r_y1": 454.803, "r_x2": 458.384, "r_y2": 446.877, "r_x3": 439.527, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 245.176, "t": 457.614, "r": 272.94, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.903, "r_x1": 272.94, "r_y1": 468.903, "r_x2": 272.94, "r_y2": 457.614, "r_x3": 245.176, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 289.017, "t": 457.614, "r": 310.004, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.903, "r_x1": 310.004, "r_y1": 468.903, "r_x2": 310.004, "r_y2": 457.614, "r_x3": 289.017, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 326.717, "t": 457.614, "r": 347.704, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.903, "r_x1": 347.704, "r_y1": 468.903, "r_x2": 347.704, "r_y2": 457.614, "r_x3": 326.717, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 363.676, "t": 457.614, "r": 384.663, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.903, "r_x1": 384.663, "r_y1": 468.903, "r_x2": 384.663, "r_y2": 457.614, "r_x3": 363.676, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 396.206, "t": 457.614, "r": 417.193, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.903, "r_x1": 417.193, "r_y1": 468.903, "r_x2": 417.193, "r_y2": 457.614, "r_x3": 396.206, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 446.653, "t": 457.614, "r": 451.26, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.903, "r_x1": 451.26, "r_y1": 468.903, "r_x2": 451.26, "r_y2": 457.614, "r_x3": 446.653, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 6, "num_cols": 8, "table_cells": [{"bbox": {"l": 144.592, "t": 339.457, "r": 183.828, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 192.195, "t": 339.457, "r": 231.431, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 239.798, "t": 344.936, "r": 278.318, "b": 356.225, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 324.67, "t": 339.457, "r": 348.264, "b": 350.746, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 396.271, "t": 339.457, "r": 417.127, "b": 350.746, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 394.927, "t": 350.416, "r": 418.473, "b": 361.705, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 430.771, "t": 339.457, "r": 467.142, "b": 350.746, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 427.148, "t": 350.416, "r": 470.761, "b": 361.705, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 286.686, "t": 352.408, "r": 312.333, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 320.702, "t": 352.408, "r": 353.72, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 369.306, "t": 352.408, "r": 379.031, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 371.238, "r": 166.513, "b": 382.527, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 371.238, "r": 214.116, "b": 382.527, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 365.758, "r": 272.94, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 365.758, "r": 310.004, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 365.758, "r": 347.704, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 363.676, "t": 365.758, "r": 384.663, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 396.206, "t": 367.973, "r": 417.193, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 367.973, "r": 458.384, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 397.539, "r": 166.513, "b": 408.828, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 397.539, "r": 214.116, "b": 408.828, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 392.06, "r": 272.94, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 392.06, "r": 310.004, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 392.06, "r": 347.704, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 362.088, "t": 392.06, "r": 386.249, "b": 415.152, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.618, "t": 394.275, "r": 418.779, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 394.275, "r": 458.384, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 423.84, "r": 166.513, "b": 435.129, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 423.84, "r": 214.116, "b": 435.129, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 418.361, "r": 272.94, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 418.361, "r": 310.004, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 418.361, "r": 347.704, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 362.088, "t": 418.361, "r": 386.249, "b": 441.453, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.618, "t": 420.576, "r": 418.779, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 420.576, "r": 458.384, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 450.142, "r": 166.513, "b": 461.431, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 450.142, "r": 214.116, "b": 461.431, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 444.662, "r": 272.94, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 444.662, "r": 310.004, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 444.662, "r": 347.704, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 362.088, "t": 446.877, "r": 386.249, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.618, "t": 446.877, "r": 418.779, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 446.877, "r": 458.384, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "section_header", "id": 5, "page_no": 8, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 134.765, "t": 508.152, "r": 264.403, "b": 516.9590000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9592539668083191, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 516.9590000000001, "r_x1": 149.402, "r_y1": 516.9590000000001, "r_x2": 149.402, "r_y2": 508.152, "r_x3": 134.765, "r_y3": 508.152, "coord_origin": "TOPLEFT"}, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 516.9590000000001, "r_x1": 264.403, "r_y1": 516.9590000000001, "r_x2": 264.403, "r_y2": 508.152, "r_x3": 160.859, "r_y3": 508.152, "coord_origin": "TOPLEFT"}, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.2 Quantitative Results"}, {"label": "text", "id": 1, "page_no": 8, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 524.5509999999999, "r": 480.596, "b": 617.035, "coord_origin": "TOPLEFT"}, "confidence": 0.9854757189750671, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.348, "r_x1": 480.591, "r_y1": 533.348, "r_x2": 480.591, "r_y2": 524.5509999999999, "r_x3": 134.765, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 164.921, "r_y1": 545.304, "r_x2": 164.921, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "quality", "orig": "quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.324, "r_y0": 545.304, "r_x1": 480.587, "r_y1": 545.304, "r_x2": 480.587, "r_y2": 536.5070000000001, "r_x3": 169.324, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.596, "r_y1": 557.259, "r_x2": 480.596, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 480.592, "r_y1": 569.2139999999999, "r_x2": 480.592, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 480.591, "r_y1": 581.169, "r_x2": 480.591, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.596, "r_y1": 593.124, "r_x2": 480.596, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.588, "r_y1": 605.08, "r_x2": 480.588, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 206.787, "r_y1": 617.035, "r_x2": 206.787, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on difficult financial tables (FinTabNet) that contain sparse and large tables."}, {"label": "text", "id": 2, "page_no": 8, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 620.193, "r": 480.596, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9851234555244446, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 628.99, "r_x1": 205.597, "r_y1": 628.99, "r_x2": 205.597, "r_y2": 620.193, "r_x3": 149.709, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.578, "r_y0": 628.99, "r_x1": 224.412, "r_y1": 628.99, "r_x2": 224.412, "r_y2": 620.193, "r_x3": 210.578, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.383, "r_y0": 628.99, "r_x1": 257.74, "r_y1": 628.99, "r_x2": 257.74, "r_y2": 620.193, "r_x3": 229.383, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "results", "orig": "results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.722, "r_y0": 628.99, "r_x1": 307.319, "r_y1": 628.99, "r_x2": 307.319, "r_y2": 620.193, "r_x3": 262.722, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "show that", "orig": "show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.301, "r_y0": 628.99, "r_x1": 480.593, "r_y1": 628.99, "r_x2": 480.593, "r_y2": 620.193, "r_x3": 312.301, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "OTSL has an advantage over HTML", "orig": "OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.596, "r_y1": 640.9449999999999, "r_x2": 480.596, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.593, "r_y1": 652.9, "r_x2": 480.593, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 405.797, "r_y1": 664.855, "r_x2": 405.797, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation."}], "body": [{"label": "text", "id": 4, "page_no": 8, "cluster": {"id": 4, "label": "text", "bbox": {"l": 134.765, "t": 118.93399999999997, "r": 480.596, "b": 151.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9805440306663513, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 127.731, "r_x1": 480.594, "r_y1": 127.731, "r_x2": 480.594, "r_y2": 118.93399999999997, "r_x3": 134.765, "r_y3": 118.93399999999997, "coord_origin": "TOPLEFT"}, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 139.68600000000004, "r_x1": 480.596, "r_y1": 139.68600000000004, "r_x2": 480.596, "r_y2": 130.889, "r_x3": 134.765, "r_y3": 130.889, "coord_origin": "TOPLEFT"}, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 151.64200000000005, "r_x1": 210.785, "r_y1": 151.64200000000005, "r_x2": 210.785, "r_y2": 142.84500000000003, "r_x3": 134.765, "r_y3": 142.84500000000003, "coord_origin": "TOPLEFT"}, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz."}, {"label": "section_header", "id": 6, "page_no": 8, "cluster": {"id": 6, "label": "section_header", "bbox": {"l": 134.765, "t": 169.18600000000004, "r": 318.448, "b": 177.99300000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9579681158065796, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 177.99300000000005, "r_x1": 149.402, "r_y1": 177.99300000000005, "r_x2": 149.402, "r_y2": 169.18600000000004, "r_x3": 134.765, "r_y3": 169.18600000000004, "coord_origin": "TOPLEFT"}, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 177.99300000000005, "r_x1": 318.448, "r_y1": 177.99300000000005, "r_x2": 318.448, "r_y2": 169.18600000000004, "r_x3": 160.859, "r_y3": 169.18600000000004, "coord_origin": "TOPLEFT"}, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.1 Hyper Parameter Optimization"}, {"label": "text", "id": 3, "page_no": 8, "cluster": {"id": 3, "label": "text", "bbox": {"l": 134.765, "t": 185.586, "r": 480.593, "b": 254.159, "coord_origin": "TOPLEFT"}, "confidence": 0.9842326641082764, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 194.38300000000004, "r_x1": 480.592, "r_y1": 194.38300000000004, "r_x2": 480.592, "r_y2": 185.586, "r_x3": 134.765, "r_y3": 185.586, "coord_origin": "TOPLEFT"}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 206.33799999999997, "r_x1": 480.592, "r_y1": 206.33799999999997, "r_x2": 480.592, "r_y2": 197.54100000000005, "r_x3": 134.765, "r_y3": 197.54100000000005, "coord_origin": "TOPLEFT"}, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 218.293, "r_x1": 480.592, "r_y1": 218.293, "r_x2": 480.592, "r_y2": 209.49599999999998, "r_x3": 134.765, "r_y3": 209.49599999999998, "coord_origin": "TOPLEFT"}, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 230.24800000000005, "r_x1": 480.593, "r_y1": 230.24800000000005, "r_x2": 480.593, "r_y2": 221.45100000000002, "r_x3": 134.765, "r_y3": 221.45100000000002, "coord_origin": "TOPLEFT"}, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 242.20299999999997, "r_x1": 440.942, "r_y1": 242.20299999999997, "r_x2": 440.942, "r_y2": 233.40599999999995, "r_x3": 134.765, "r_y3": 233.40599999999995, "coord_origin": "TOPLEFT"}, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.868, "r_y0": 242.20299999999997, "r_x1": 480.588, "r_y1": 242.20299999999997, "r_x2": 480.588, "r_y2": 233.40599999999995, "r_x3": 444.868, "r_y3": 233.40599999999995, "coord_origin": "TOPLEFT"}, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 254.159, "r_x1": 145.201, "r_y1": 254.159, "r_x2": 145.201, "r_y2": 245.36199999999997, "r_x3": 134.765, "r_y3": 245.36199999999997, "coord_origin": "TOPLEFT"}, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.149, "r_y0": 254.159, "r_x1": 311.22, "r_y1": 254.159, "r_x2": 311.22, "r_y2": 245.36199999999997, "r_x3": 149.149, "r_y3": 245.36199999999997, "coord_origin": "TOPLEFT"}, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML."}, {"label": "caption", "id": 7, "page_no": 8, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 134.765, "t": 272.85699999999997, "r": 480.595, "b": 327.982, "coord_origin": "TOPLEFT"}, "confidence": 0.9570781588554382, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 282.998, "r_x1": 160.118, "r_y1": 282.998, "r_x2": 160.118, "r_y2": 275.072, "r_x3": 134.765, "r_y3": 275.072, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.345, "r_y0": 282.998, "r_x1": 175.595, "r_y1": 282.998, "r_x2": 175.595, "r_y2": 275.072, "r_x3": 167.345, "r_y3": 275.072, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.133, "r_y0": 284.146, "r_x1": 255.736, "r_y1": 284.146, "r_x2": 255.736, "r_y2": 272.85699999999997, "r_x3": 188.133, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "HPO performed", "orig": "HPO performed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.013, "r_y0": 284.146, "r_x1": 269.69, "r_y1": 284.146, "r_x2": 269.69, "r_y2": 272.85699999999997, "r_x3": 262.013, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.957, "r_y0": 284.146, "r_x1": 300.652, "r_y1": 284.146, "r_x2": 300.652, "r_y2": 272.85699999999997, "r_x3": 275.957, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.92, "r_y0": 284.146, "r_x1": 321.763, "r_y1": 284.146, "r_x2": 321.763, "r_y2": 272.85699999999997, "r_x3": 306.92, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.03, "r_y0": 284.146, "r_x1": 419.24, "r_y1": 284.146, "r_x2": 419.24, "r_y2": 272.85699999999997, "r_x3": 328.03, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "HTML representation", "orig": "HTML representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.508, "r_y0": 284.146, "r_x1": 435.233, "r_y1": 284.146, "r_x2": 435.233, "r_y2": 272.85699999999997, "r_x3": 425.508, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.509, "r_y0": 284.146, "r_x1": 454.309, "r_y1": 284.146, "r_x2": 454.309, "r_y2": 272.85699999999997, "r_x3": 441.509, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.576, "r_y0": 284.146, "r_x1": 480.594, "r_y1": 284.146, "r_x2": 480.594, "r_y2": 272.85699999999997, "r_x3": 460.576, "r_y3": 272.85699999999997, "coord_origin": "TOPLEFT"}, "text": "same", "orig": "same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 295.105, "r_x1": 480.595, "r_y1": 295.105, "r_x2": 480.595, "r_y2": 283.816, "r_x3": 134.765, "r_y3": 283.816, "coord_origin": "TOPLEFT"}, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 306.064, "r_x1": 480.595, "r_y1": 306.064, "r_x2": 480.595, "r_y2": 294.775, "r_x3": 134.765, "r_y3": 294.775, "coord_origin": "TOPLEFT"}, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 317.023, "r_x1": 163.504, "r_y1": 317.023, "r_x2": 163.504, "r_y2": 305.734, "r_x3": 134.765, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "smaller", "orig": "smaller", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.817, "r_y0": 317.023, "r_x1": 443.264, "r_y1": 317.023, "r_x2": 443.264, "r_y2": 305.734, "r_x3": 167.817, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "models trained on OTSL perform better, especially in recognizing", "orig": "models trained on OTSL perform better, especially in recognizing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.577, "r_y0": 317.023, "r_x1": 480.595, "r_y1": 317.023, "r_x2": 480.595, "r_y2": 305.734, "r_x3": 447.577, "r_y3": 305.734, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 327.982, "r_x1": 480.595, "r_y1": 327.982, "r_x2": 480.595, "r_y2": 316.693, "r_x3": 134.765, "r_y3": 316.693, "coord_origin": "TOPLEFT"}, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart."}, {"label": "table", "id": 0, "page_no": 8, "cluster": {"id": 0, "label": "table", "bbox": {"l": 139.66845703125, "t": 337.5747985839844, "r": 475.00372314453125, "b": 469.4721374511719, "coord_origin": "TOPLEFT"}, "confidence": 0.9901032447814941, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.746, "r_x1": 168.048, "r_y1": 350.746, "r_x2": 168.048, "r_y2": 339.457, "r_x3": 160.37, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 363.697, "r_x1": 183.828, "r_y1": 363.697, "r_x2": 183.828, "r_y2": 352.408, "r_x3": 144.592, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.746, "r_x1": 215.652, "r_y1": 350.746, "r_x2": 215.652, "r_y2": 339.457, "r_x3": 207.974, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 363.697, "r_x1": 231.431, "r_y1": 363.697, "r_x2": 231.431, "r_y2": 352.408, "r_x3": 192.195, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 356.225, "r_x1": 278.318, "r_y1": 356.225, "r_x2": 278.318, "r_y2": 344.936, "r_x3": 239.798, "r_y3": 344.936, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.746, "r_x1": 348.264, "r_y1": 350.746, "r_x2": 348.264, "r_y2": 339.457, "r_x3": 324.67, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.746, "r_x1": 417.127, "r_y1": 350.746, "r_x2": 417.127, "r_y2": 339.457, "r_x3": 396.271, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 361.705, "r_x1": 418.473, "r_y1": 361.705, "r_x2": 418.473, "r_y2": 350.416, "r_x3": 394.927, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.746, "r_x1": 467.142, "r_y1": 350.746, "r_x2": 467.142, "r_y2": 339.457, "r_x3": 430.771, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 361.705, "r_x1": 470.761, "r_y1": 361.705, "r_x2": 470.761, "r_y2": 350.416, "r_x3": 427.148, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 363.697, "r_x1": 312.333, "r_y1": 363.697, "r_x2": 312.333, "r_y2": 352.408, "r_x3": 286.686, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 363.697, "r_x1": 353.72, "r_y1": 363.697, "r_x2": 353.72, "r_y2": 352.408, "r_x3": 320.702, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 363.697, "r_x1": 379.031, "r_y1": 363.697, "r_x2": 379.031, "r_y2": 352.408, "r_x3": 369.306, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 382.527, "r_x1": 166.513, "r_y1": 382.527, "r_x2": 166.513, "r_y2": 371.238, "r_x3": 161.906, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 382.527, "r_x1": 214.116, "r_y1": 382.527, "r_x2": 214.116, "r_y2": 371.238, "r_x3": 209.509, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 377.047, "r_x1": 271.405, "r_y1": 377.047, "r_x2": 271.405, "r_y2": 365.758, "r_x3": 246.71, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 377.047, "r_x1": 310.004, "r_y1": 377.047, "r_x2": 310.004, "r_y2": 365.758, "r_x3": 289.017, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 377.047, "r_x1": 347.704, "r_y1": 377.047, "r_x2": 347.704, "r_y2": 365.758, "r_x3": 326.717, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 377.047, "r_x1": 384.663, "r_y1": 377.047, "r_x2": 384.663, "r_y2": 365.758, "r_x3": 363.676, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 375.899, "r_x1": 416.127, "r_y1": 375.899, "r_x2": 416.127, "r_y2": 367.973, "r_x3": 397.27, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 375.899, "r_x1": 458.384, "r_y1": 375.899, "r_x2": 458.384, "r_y2": 367.973, "r_x3": 439.527, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.999, "r_x1": 272.94, "r_y1": 389.999, "r_x2": 272.94, "r_y2": 378.71, "r_x3": 245.176, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.999, "r_x1": 310.004, "r_y1": 389.999, "r_x2": 310.004, "r_y2": 378.71, "r_x3": 289.017, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.999, "r_x1": 347.704, "r_y1": 389.999, "r_x2": 347.704, "r_y2": 378.71, "r_x3": 326.717, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.999, "r_x1": 384.663, "r_y1": 389.999, "r_x2": 384.663, "r_y2": 378.71, "r_x3": 363.676, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.999, "r_x1": 417.193, "r_y1": 389.999, "r_x2": 417.193, "r_y2": 378.71, "r_x3": 396.206, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.999, "r_x1": 457.147, "r_y1": 389.999, "r_x2": 457.147, "r_y2": 378.71, "r_x3": 440.767, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.828, "r_x1": 166.513, "r_y1": 408.828, "r_x2": 166.513, "r_y2": 397.539, "r_x3": 161.906, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.828, "r_x1": 214.116, "r_y1": 408.828, "r_x2": 214.116, "r_y2": 397.539, "r_x3": 209.509, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 403.349, "r_x1": 271.405, "r_y1": 403.349, "r_x2": 271.405, "r_y2": 392.06, "r_x3": 246.71, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 403.349, "r_x1": 310.004, "r_y1": 403.349, "r_x2": 310.004, "r_y2": 392.06, "r_x3": 289.017, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 403.349, "r_x1": 347.704, "r_y1": 403.349, "r_x2": 347.704, "r_y2": 392.06, "r_x3": 326.717, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 403.349, "r_x1": 384.663, "r_y1": 403.349, "r_x2": 384.663, "r_y2": 392.06, "r_x3": 363.676, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 402.201, "r_x1": 418.779, "r_y1": 402.201, "r_x2": 418.779, "r_y2": 394.275, "r_x3": 394.618, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 402.201, "r_x1": 458.384, "r_y1": 402.201, "r_x2": 458.384, "r_y2": 394.275, "r_x3": 439.527, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 416.3, "r_x1": 272.94, "r_y1": 416.3, "r_x2": 272.94, "r_y2": 405.011, "r_x3": 245.176, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 416.3, "r_x1": 310.004, "r_y1": 416.3, "r_x2": 310.004, "r_y2": 405.011, "r_x3": 289.017, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 416.3, "r_x1": 347.704, "r_y1": 416.3, "r_x2": 347.704, "r_y2": 405.011, "r_x3": 326.717, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 415.152, "r_x1": 386.249, "r_y1": 415.152, "r_x2": 386.249, "r_y2": 407.226, "r_x3": 362.088, "r_y3": 407.226, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 416.3, "r_x1": 417.193, "r_y1": 416.3, "r_x2": 417.193, "r_y2": 405.011, "r_x3": 396.206, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 416.3, "r_x1": 457.147, "r_y1": 416.3, "r_x2": 457.147, "r_y2": 405.011, "r_x3": 440.767, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 435.129, "r_x1": 166.513, "r_y1": 435.129, "r_x2": 166.513, "r_y2": 423.84, "r_x3": 161.906, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 435.129, "r_x1": 214.116, "r_y1": 435.129, "r_x2": 214.116, "r_y2": 423.84, "r_x3": 209.509, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 429.65, "r_x1": 271.405, "r_y1": 429.65, "r_x2": 271.405, "r_y2": 418.361, "r_x3": 246.71, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 429.65, "r_x1": 310.004, "r_y1": 429.65, "r_x2": 310.004, "r_y2": 418.361, "r_x3": 289.017, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 429.65, "r_x1": 347.704, "r_y1": 429.65, "r_x2": 347.704, "r_y2": 418.361, "r_x3": 326.717, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 429.65, "r_x1": 384.663, "r_y1": 429.65, "r_x2": 384.663, "r_y2": 418.361, "r_x3": 363.676, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 428.502, "r_x1": 418.779, "r_y1": 428.502, "r_x2": 418.779, "r_y2": 420.576, "r_x3": 394.618, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 428.502, "r_x1": 458.384, "r_y1": 428.502, "r_x2": 458.384, "r_y2": 420.576, "r_x3": 439.527, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 442.601, "r_x1": 272.94, "r_y1": 442.601, "r_x2": 272.94, "r_y2": 431.312, "r_x3": 245.176, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 442.601, "r_x1": 310.004, "r_y1": 442.601, "r_x2": 310.004, "r_y2": 431.312, "r_x3": 289.017, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 442.601, "r_x1": 347.704, "r_y1": 442.601, "r_x2": 347.704, "r_y2": 431.312, "r_x3": 326.717, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 441.453, "r_x1": 386.249, "r_y1": 441.453, "r_x2": 386.249, "r_y2": 433.527, "r_x3": 362.088, "r_y3": 433.527, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 442.601, "r_x1": 417.193, "r_y1": 442.601, "r_x2": 417.193, "r_y2": 431.312, "r_x3": 396.206, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 442.601, "r_x1": 457.147, "r_y1": 442.601, "r_x2": 457.147, "r_y2": 431.312, "r_x3": 440.767, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 461.431, "r_x1": 166.513, "r_y1": 461.431, "r_x2": 166.513, "r_y2": 450.142, "r_x3": 161.906, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 461.431, "r_x1": 214.116, "r_y1": 461.431, "r_x2": 214.116, "r_y2": 450.142, "r_x3": 209.509, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.951, "r_x1": 271.405, "r_y1": 455.951, "r_x2": 271.405, "r_y2": 444.662, "r_x3": 246.71, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.951, "r_x1": 310.004, "r_y1": 455.951, "r_x2": 310.004, "r_y2": 444.662, "r_x3": 289.017, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.951, "r_x1": 345.401, "r_y1": 455.951, "r_x2": 345.401, "r_y2": 444.662, "r_x3": 329.021, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 454.803, "r_x1": 386.249, "r_y1": 454.803, "r_x2": 386.249, "r_y2": 446.877, "r_x3": 362.088, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 454.803, "r_x1": 418.779, "r_y1": 454.803, "r_x2": 418.779, "r_y2": 446.877, "r_x3": 394.618, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 454.803, "r_x1": 458.384, "r_y1": 454.803, "r_x2": 458.384, "r_y2": 446.877, "r_x3": 439.527, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.903, "r_x1": 272.94, "r_y1": 468.903, "r_x2": 272.94, "r_y2": 457.614, "r_x3": 245.176, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.903, "r_x1": 310.004, "r_y1": 468.903, "r_x2": 310.004, "r_y2": 457.614, "r_x3": 289.017, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.903, "r_x1": 347.704, "r_y1": 468.903, "r_x2": 347.704, "r_y2": 457.614, "r_x3": 326.717, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.903, "r_x1": 384.663, "r_y1": 468.903, "r_x2": 384.663, "r_y2": 457.614, "r_x3": 363.676, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.903, "r_x1": 417.193, "r_y1": 468.903, "r_x2": 417.193, "r_y2": 457.614, "r_x3": 396.206, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.903, "r_x1": 451.26, "r_y1": 468.903, "r_x2": 451.26, "r_y2": 457.614, "r_x3": 446.653, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 160.37, "t": 339.457, "r": 168.048, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.37, "r_y0": 350.746, "r_x1": 168.048, "r_y1": 350.746, "r_x2": 168.048, "r_y2": 339.457, "r_x3": 160.37, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 144.592, "t": 352.408, "r": 183.828, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.592, "r_y0": 363.697, "r_x1": 183.828, "r_y1": 363.697, "r_x2": 183.828, "r_y2": 352.408, "r_x3": 144.592, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 207.974, "t": 339.457, "r": 215.652, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.974, "r_y0": 350.746, "r_x1": 215.652, "r_y1": 350.746, "r_x2": 215.652, "r_y2": 339.457, "r_x3": 207.974, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 192.195, "t": 352.408, "r": 231.431, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.195, "r_y0": 363.697, "r_x1": 231.431, "r_y1": 363.697, "r_x2": 231.431, "r_y2": 352.408, "r_x3": 192.195, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 239.798, "t": 344.936, "r": 278.318, "b": 356.225, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.798, "r_y0": 356.225, "r_x1": 278.318, "r_y1": 356.225, "r_x2": 278.318, "r_y2": 344.936, "r_x3": 239.798, "r_y3": 344.936, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 324.67, "t": 339.457, "r": 348.264, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.67, "r_y0": 350.746, "r_x1": 348.264, "r_y1": 350.746, "r_x2": 348.264, "r_y2": 339.457, "r_x3": 324.67, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 396.271, "t": 339.457, "r": 417.127, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.271, "r_y0": 350.746, "r_x1": 417.127, "r_y1": 350.746, "r_x2": 417.127, "r_y2": 339.457, "r_x3": 396.271, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 394.927, "t": 350.416, "r": 418.473, "b": 361.705, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.927, "r_y0": 361.705, "r_x1": 418.473, "r_y1": 361.705, "r_x2": 418.473, "r_y2": 350.416, "r_x3": 394.927, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 430.771, "t": 339.457, "r": 467.142, "b": 350.746, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.771, "r_y0": 350.746, "r_x1": 467.142, "r_y1": 350.746, "r_x2": 467.142, "r_y2": 339.457, "r_x3": 430.771, "r_y3": 339.457, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 427.148, "t": 350.416, "r": 470.761, "b": 361.705, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.148, "r_y0": 361.705, "r_x1": 470.761, "r_y1": 361.705, "r_x2": 470.761, "r_y2": 350.416, "r_x3": 427.148, "r_y3": 350.416, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 286.686, "t": 352.408, "r": 312.333, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.686, "r_y0": 363.697, "r_x1": 312.333, "r_y1": 363.697, "r_x2": 312.333, "r_y2": 352.408, "r_x3": 286.686, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 320.702, "t": 352.408, "r": 353.72, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.702, "r_y0": 363.697, "r_x1": 353.72, "r_y1": 363.697, "r_x2": 353.72, "r_y2": 352.408, "r_x3": 320.702, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 369.306, "t": 352.408, "r": 379.031, "b": 363.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.306, "r_y0": 363.697, "r_x1": 379.031, "r_y1": 363.697, "r_x2": 379.031, "r_y2": 352.408, "r_x3": 369.306, "r_y3": 352.408, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 161.906, "t": 371.238, "r": 166.513, "b": 382.527, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 382.527, "r_x1": 166.513, "r_y1": 382.527, "r_x2": 166.513, "r_y2": 371.238, "r_x3": 161.906, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 209.509, "t": 371.238, "r": 214.116, "b": 382.527, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 382.527, "r_x1": 214.116, "r_y1": 382.527, "r_x2": 214.116, "r_y2": 371.238, "r_x3": 209.509, "r_y3": 371.238, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 246.71, "t": 365.758, "r": 271.405, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 377.047, "r_x1": 271.405, "r_y1": 377.047, "r_x2": 271.405, "r_y2": 365.758, "r_x3": 246.71, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 289.017, "t": 365.758, "r": 310.004, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 377.047, "r_x1": 310.004, "r_y1": 377.047, "r_x2": 310.004, "r_y2": 365.758, "r_x3": 289.017, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 326.717, "t": 365.758, "r": 347.704, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 377.047, "r_x1": 347.704, "r_y1": 377.047, "r_x2": 347.704, "r_y2": 365.758, "r_x3": 326.717, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 363.676, "t": 365.758, "r": 384.663, "b": 377.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 377.047, "r_x1": 384.663, "r_y1": 377.047, "r_x2": 384.663, "r_y2": 365.758, "r_x3": 363.676, "r_y3": 365.758, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 397.27, "t": 367.973, "r": 416.127, "b": 375.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.27, "r_y0": 375.899, "r_x1": 416.127, "r_y1": 375.899, "r_x2": 416.127, "r_y2": 367.973, "r_x3": 397.27, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 439.527, "t": 367.973, "r": 458.384, "b": 375.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 375.899, "r_x1": 458.384, "r_y1": 375.899, "r_x2": 458.384, "r_y2": 367.973, "r_x3": 439.527, "r_y3": 367.973, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 245.176, "t": 378.71, "r": 272.94, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 389.999, "r_x1": 272.94, "r_y1": 389.999, "r_x2": 272.94, "r_y2": 378.71, "r_x3": 245.176, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 289.017, "t": 378.71, "r": 310.004, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 389.999, "r_x1": 310.004, "r_y1": 389.999, "r_x2": 310.004, "r_y2": 378.71, "r_x3": 289.017, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 326.717, "t": 378.71, "r": 347.704, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 389.999, "r_x1": 347.704, "r_y1": 389.999, "r_x2": 347.704, "r_y2": 378.71, "r_x3": 326.717, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 363.676, "t": 378.71, "r": 384.663, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 389.999, "r_x1": 384.663, "r_y1": 389.999, "r_x2": 384.663, "r_y2": 378.71, "r_x3": 363.676, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 396.206, "t": 378.71, "r": 417.193, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 389.999, "r_x1": 417.193, "r_y1": 389.999, "r_x2": 417.193, "r_y2": 378.71, "r_x3": 396.206, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 440.767, "t": 378.71, "r": 457.147, "b": 389.999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 389.999, "r_x1": 457.147, "r_y1": 389.999, "r_x2": 457.147, "r_y2": 378.71, "r_x3": 440.767, "r_y3": 378.71, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 161.906, "t": 397.539, "r": 166.513, "b": 408.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 408.828, "r_x1": 166.513, "r_y1": 408.828, "r_x2": 166.513, "r_y2": 397.539, "r_x3": 161.906, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 209.509, "t": 397.539, "r": 214.116, "b": 408.828, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 408.828, "r_x1": 214.116, "r_y1": 408.828, "r_x2": 214.116, "r_y2": 397.539, "r_x3": 209.509, "r_y3": 397.539, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 246.71, "t": 392.06, "r": 271.405, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 403.349, "r_x1": 271.405, "r_y1": 403.349, "r_x2": 271.405, "r_y2": 392.06, "r_x3": 246.71, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 289.017, "t": 392.06, "r": 310.004, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 403.349, "r_x1": 310.004, "r_y1": 403.349, "r_x2": 310.004, "r_y2": 392.06, "r_x3": 289.017, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 326.717, "t": 392.06, "r": 347.704, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 403.349, "r_x1": 347.704, "r_y1": 403.349, "r_x2": 347.704, "r_y2": 392.06, "r_x3": 326.717, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 363.676, "t": 392.06, "r": 384.663, "b": 403.349, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 403.349, "r_x1": 384.663, "r_y1": 403.349, "r_x2": 384.663, "r_y2": 392.06, "r_x3": 363.676, "r_y3": 392.06, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 394.618, "t": 394.275, "r": 418.779, "b": 402.201, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 402.201, "r_x1": 418.779, "r_y1": 402.201, "r_x2": 418.779, "r_y2": 394.275, "r_x3": 394.618, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 439.527, "t": 394.275, "r": 458.384, "b": 402.201, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 402.201, "r_x1": 458.384, "r_y1": 402.201, "r_x2": 458.384, "r_y2": 394.275, "r_x3": 439.527, "r_y3": 394.275, "coord_origin": "TOPLEFT"}, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 245.176, "t": 405.011, "r": 272.94, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 416.3, "r_x1": 272.94, "r_y1": 416.3, "r_x2": 272.94, "r_y2": 405.011, "r_x3": 245.176, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 289.017, "t": 405.011, "r": 310.004, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 416.3, "r_x1": 310.004, "r_y1": 416.3, "r_x2": 310.004, "r_y2": 405.011, "r_x3": 289.017, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 326.717, "t": 405.011, "r": 347.704, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 416.3, "r_x1": 347.704, "r_y1": 416.3, "r_x2": 347.704, "r_y2": 405.011, "r_x3": 326.717, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 362.088, "t": 407.226, "r": 386.249, "b": 415.152, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 415.152, "r_x1": 386.249, "r_y1": 415.152, "r_x2": 386.249, "r_y2": 407.226, "r_x3": 362.088, "r_y3": 407.226, "coord_origin": "TOPLEFT"}, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 396.206, "t": 405.011, "r": 417.193, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 416.3, "r_x1": 417.193, "r_y1": 416.3, "r_x2": 417.193, "r_y2": 405.011, "r_x3": 396.206, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 440.767, "t": 405.011, "r": 457.147, "b": 416.3, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 416.3, "r_x1": 457.147, "r_y1": 416.3, "r_x2": 457.147, "r_y2": 405.011, "r_x3": 440.767, "r_y3": 405.011, "coord_origin": "TOPLEFT"}, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 161.906, "t": 423.84, "r": 166.513, "b": 435.129, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 435.129, "r_x1": 166.513, "r_y1": 435.129, "r_x2": 166.513, "r_y2": 423.84, "r_x3": 161.906, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 209.509, "t": 423.84, "r": 214.116, "b": 435.129, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 435.129, "r_x1": 214.116, "r_y1": 435.129, "r_x2": 214.116, "r_y2": 423.84, "r_x3": 209.509, "r_y3": 423.84, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 246.71, "t": 418.361, "r": 271.405, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 429.65, "r_x1": 271.405, "r_y1": 429.65, "r_x2": 271.405, "r_y2": 418.361, "r_x3": 246.71, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 289.017, "t": 418.361, "r": 310.004, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 429.65, "r_x1": 310.004, "r_y1": 429.65, "r_x2": 310.004, "r_y2": 418.361, "r_x3": 289.017, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 326.717, "t": 418.361, "r": 347.704, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 429.65, "r_x1": 347.704, "r_y1": 429.65, "r_x2": 347.704, "r_y2": 418.361, "r_x3": 326.717, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 363.676, "t": 418.361, "r": 384.663, "b": 429.65, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 429.65, "r_x1": 384.663, "r_y1": 429.65, "r_x2": 384.663, "r_y2": 418.361, "r_x3": 363.676, "r_y3": 418.361, "coord_origin": "TOPLEFT"}, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 394.618, "t": 420.576, "r": 418.779, "b": 428.502, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 428.502, "r_x1": 418.779, "r_y1": 428.502, "r_x2": 418.779, "r_y2": 420.576, "r_x3": 394.618, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 439.527, "t": 420.576, "r": 458.384, "b": 428.502, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 428.502, "r_x1": 458.384, "r_y1": 428.502, "r_x2": 458.384, "r_y2": 420.576, "r_x3": 439.527, "r_y3": 420.576, "coord_origin": "TOPLEFT"}, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 245.176, "t": 431.312, "r": 272.94, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 442.601, "r_x1": 272.94, "r_y1": 442.601, "r_x2": 272.94, "r_y2": 431.312, "r_x3": 245.176, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 289.017, "t": 431.312, "r": 310.004, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 442.601, "r_x1": 310.004, "r_y1": 442.601, "r_x2": 310.004, "r_y2": 431.312, "r_x3": 289.017, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 326.717, "t": 431.312, "r": 347.704, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 442.601, "r_x1": 347.704, "r_y1": 442.601, "r_x2": 347.704, "r_y2": 431.312, "r_x3": 326.717, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 362.088, "t": 433.527, "r": 386.249, "b": 441.453, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 441.453, "r_x1": 386.249, "r_y1": 441.453, "r_x2": 386.249, "r_y2": 433.527, "r_x3": 362.088, "r_y3": 433.527, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 396.206, "t": 431.312, "r": 417.193, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 442.601, "r_x1": 417.193, "r_y1": 442.601, "r_x2": 417.193, "r_y2": 431.312, "r_x3": 396.206, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 440.767, "t": 431.312, "r": 457.147, "b": 442.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.767, "r_y0": 442.601, "r_x1": 457.147, "r_y1": 442.601, "r_x2": 457.147, "r_y2": 431.312, "r_x3": 440.767, "r_y3": 431.312, "coord_origin": "TOPLEFT"}, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 161.906, "t": 450.142, "r": 166.513, "b": 461.431, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.906, "r_y0": 461.431, "r_x1": 166.513, "r_y1": 461.431, "r_x2": 166.513, "r_y2": 450.142, "r_x3": 161.906, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 209.509, "t": 450.142, "r": 214.116, "b": 461.431, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.509, "r_y0": 461.431, "r_x1": 214.116, "r_y1": 461.431, "r_x2": 214.116, "r_y2": 450.142, "r_x3": 209.509, "r_y3": 450.142, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 246.71, "t": 444.662, "r": 271.405, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.71, "r_y0": 455.951, "r_x1": 271.405, "r_y1": 455.951, "r_x2": 271.405, "r_y2": 444.662, "r_x3": 246.71, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 289.017, "t": 444.662, "r": 310.004, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 455.951, "r_x1": 310.004, "r_y1": 455.951, "r_x2": 310.004, "r_y2": 444.662, "r_x3": 289.017, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 329.021, "t": 444.662, "r": 345.401, "b": 455.951, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.021, "r_y0": 455.951, "r_x1": 345.401, "r_y1": 455.951, "r_x2": 345.401, "r_y2": 444.662, "r_x3": 329.021, "r_y3": 444.662, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 362.088, "t": 446.877, "r": 386.249, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.088, "r_y0": 454.803, "r_x1": 386.249, "r_y1": 454.803, "r_x2": 386.249, "r_y2": 446.877, "r_x3": 362.088, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 394.618, "t": 446.877, "r": 418.779, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.618, "r_y0": 454.803, "r_x1": 418.779, "r_y1": 454.803, "r_x2": 418.779, "r_y2": 446.877, "r_x3": 394.618, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 439.527, "t": 446.877, "r": 458.384, "b": 454.803, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.527, "r_y0": 454.803, "r_x1": 458.384, "r_y1": 454.803, "r_x2": 458.384, "r_y2": 446.877, "r_x3": 439.527, "r_y3": 446.877, "coord_origin": "TOPLEFT"}, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 245.176, "t": 457.614, "r": 272.94, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.176, "r_y0": 468.903, "r_x1": 272.94, "r_y1": 468.903, "r_x2": 272.94, "r_y2": 457.614, "r_x3": 245.176, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 289.017, "t": 457.614, "r": 310.004, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.017, "r_y0": 468.903, "r_x1": 310.004, "r_y1": 468.903, "r_x2": 310.004, "r_y2": 457.614, "r_x3": 289.017, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 326.717, "t": 457.614, "r": 347.704, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.717, "r_y0": 468.903, "r_x1": 347.704, "r_y1": 468.903, "r_x2": 347.704, "r_y2": 457.614, "r_x3": 326.717, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 363.676, "t": 457.614, "r": 384.663, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 363.676, "r_y0": 468.903, "r_x1": 384.663, "r_y1": 468.903, "r_x2": 384.663, "r_y2": 457.614, "r_x3": 363.676, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 396.206, "t": 457.614, "r": 417.193, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.206, "r_y0": 468.903, "r_x1": 417.193, "r_y1": 468.903, "r_x2": 417.193, "r_y2": 457.614, "r_x3": 396.206, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 446.653, "t": 457.614, "r": 451.26, "b": 468.903, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.653, "r_y0": 468.903, "r_x1": 451.26, "r_y1": 468.903, "r_x2": 451.26, "r_y2": 457.614, "r_x3": 446.653, "r_y3": 457.614, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 6, "num_cols": 8, "table_cells": [{"bbox": {"l": 144.592, "t": 339.457, "r": 183.828, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 192.195, "t": 339.457, "r": 231.431, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 239.798, "t": 344.936, "r": 278.318, "b": 356.225, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 324.67, "t": 339.457, "r": 348.264, "b": 350.746, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 396.271, "t": 339.457, "r": 417.127, "b": 350.746, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 394.927, "t": 350.416, "r": 418.473, "b": 361.705, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 430.771, "t": 339.457, "r": 467.142, "b": 350.746, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 427.148, "t": 350.416, "r": 470.761, "b": 361.705, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 286.686, "t": 352.408, "r": 312.333, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 320.702, "t": 352.408, "r": 353.72, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 369.306, "t": 352.408, "r": 379.031, "b": 363.697, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 371.238, "r": 166.513, "b": 382.527, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 371.238, "r": 214.116, "b": 382.527, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 365.758, "r": 272.94, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 365.758, "r": 310.004, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 365.758, "r": 347.704, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 363.676, "t": 365.758, "r": 384.663, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 396.206, "t": 367.973, "r": 417.193, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 367.973, "r": 458.384, "b": 389.999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 397.539, "r": 166.513, "b": 408.828, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 397.539, "r": 214.116, "b": 408.828, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 392.06, "r": 272.94, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 392.06, "r": 310.004, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 392.06, "r": 347.704, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 362.088, "t": 392.06, "r": 386.249, "b": 415.152, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.618, "t": 394.275, "r": 418.779, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 394.275, "r": 458.384, "b": 416.3, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 423.84, "r": 166.513, "b": 435.129, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 423.84, "r": 214.116, "b": 435.129, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 418.361, "r": 272.94, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 418.361, "r": 310.004, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 418.361, "r": 347.704, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 362.088, "t": 418.361, "r": 386.249, "b": 441.453, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.618, "t": 420.576, "r": 418.779, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 420.576, "r": 458.384, "b": 442.601, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 161.906, "t": 450.142, "r": 166.513, "b": 461.431, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 209.509, "t": 450.142, "r": 214.116, "b": 461.431, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 245.176, "t": 444.662, "r": 272.94, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 289.017, "t": 444.662, "r": 310.004, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.717, "t": 444.662, "r": 347.704, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 362.088, "t": 446.877, "r": 386.249, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.618, "t": 446.877, "r": 418.779, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 439.527, "t": 446.877, "r": 458.384, "b": 468.903, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "section_header", "id": 5, "page_no": 8, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 134.765, "t": 508.152, "r": 264.403, "b": 516.9590000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9592539668083191, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 516.9590000000001, "r_x1": 149.402, "r_y1": 516.9590000000001, "r_x2": 149.402, "r_y2": 508.152, "r_x3": 134.765, "r_y3": 508.152, "coord_origin": "TOPLEFT"}, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 516.9590000000001, "r_x1": 264.403, "r_y1": 516.9590000000001, "r_x2": 264.403, "r_y2": 508.152, "r_x3": 160.859, "r_y3": 508.152, "coord_origin": "TOPLEFT"}, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.2 Quantitative Results"}, {"label": "text", "id": 1, "page_no": 8, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 524.5509999999999, "r": 480.596, "b": 617.035, "coord_origin": "TOPLEFT"}, "confidence": 0.9854757189750671, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 533.348, "r_x1": 480.591, "r_y1": 533.348, "r_x2": 480.591, "r_y2": 524.5509999999999, "r_x3": 134.765, "r_y3": 524.5509999999999, "coord_origin": "TOPLEFT"}, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 545.304, "r_x1": 164.921, "r_y1": 545.304, "r_x2": 164.921, "r_y2": 536.5070000000001, "r_x3": 134.765, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "quality", "orig": "quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.324, "r_y0": 545.304, "r_x1": 480.587, "r_y1": 545.304, "r_x2": 480.587, "r_y2": 536.5070000000001, "r_x3": 169.324, "r_y3": 536.5070000000001, "coord_origin": "TOPLEFT"}, "text": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "(enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 557.259, "r_x1": 480.596, "r_y1": 557.259, "r_x2": 480.596, "r_y2": 548.462, "r_x3": 134.765, "r_y3": 548.462, "coord_origin": "TOPLEFT"}, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 569.2139999999999, "r_x1": 480.592, "r_y1": 569.2139999999999, "r_x2": 480.592, "r_y2": 560.417, "r_x3": 134.765, "r_y3": 560.417, "coord_origin": "TOPLEFT"}, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 581.169, "r_x1": 480.591, "r_y1": 581.169, "r_x2": 480.591, "r_y2": 572.3720000000001, "r_x3": 134.765, "r_y3": 572.3720000000001, "coord_origin": "TOPLEFT"}, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 593.124, "r_x1": 480.596, "r_y1": 593.124, "r_x2": 480.596, "r_y2": 584.327, "r_x3": 134.765, "r_y3": 584.327, "coord_origin": "TOPLEFT"}, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 605.08, "r_x1": 480.588, "r_y1": 605.08, "r_x2": 480.588, "r_y2": 596.283, "r_x3": 134.765, "r_y3": 596.283, "coord_origin": "TOPLEFT"}, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 617.035, "r_x1": 206.787, "r_y1": 617.035, "r_x2": 206.787, "r_y2": 608.238, "r_x3": 134.765, "r_y3": 608.238, "coord_origin": "TOPLEFT"}, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on difficult financial tables (FinTabNet) that contain sparse and large tables."}, {"label": "text", "id": 2, "page_no": 8, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 620.193, "r": 480.596, "b": 664.855, "coord_origin": "TOPLEFT"}, "confidence": 0.9851234555244446, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 628.99, "r_x1": 205.597, "r_y1": 628.99, "r_x2": 205.597, "r_y2": 620.193, "r_x3": 149.709, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.578, "r_y0": 628.99, "r_x1": 224.412, "r_y1": 628.99, "r_x2": 224.412, "r_y2": 620.193, "r_x3": 210.578, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.383, "r_y0": 628.99, "r_x1": 257.74, "r_y1": 628.99, "r_x2": 257.74, "r_y2": 620.193, "r_x3": 229.383, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "results", "orig": "results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.722, "r_y0": 628.99, "r_x1": 307.319, "r_y1": 628.99, "r_x2": 307.319, "r_y2": 620.193, "r_x3": 262.722, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "show that", "orig": "show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.301, "r_y0": 628.99, "r_x1": 480.593, "r_y1": 628.99, "r_x2": 480.593, "r_y2": 620.193, "r_x3": 312.301, "r_y3": 620.193, "coord_origin": "TOPLEFT"}, "text": "OTSL has an advantage over HTML", "orig": "OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 640.9449999999999, "r_x1": 480.596, "r_y1": 640.9449999999999, "r_x2": 480.596, "r_y2": 632.148, "r_x3": 134.765, "r_y3": 632.148, "coord_origin": "TOPLEFT"}, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 652.9, "r_x1": 480.593, "r_y1": 652.9, "r_x2": 480.593, "r_y2": 644.1030000000001, "r_x3": 134.765, "r_y3": 644.1030000000001, "coord_origin": "TOPLEFT"}, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 664.855, "r_x1": 405.797, "r_y1": 664.855, "r_x2": 405.797, "r_y2": 656.058, "r_x3": 134.765, "r_y3": 656.058, "coord_origin": "TOPLEFT"}, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation."}], "headers": [{"label": "page_header", "id": 8, "page_no": 8, "cluster": {"id": 8, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9373378753662109, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 9, "page_no": 8, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 475.984, "t": 91.49300000000005, "r": 480.591, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8857625722885132, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.984, "r_y0": 102.78200000000004, "r_x1": 480.591, "r_y1": 102.78200000000004, "r_x2": 480.591, "r_y2": 91.49300000000005, "r_x3": 475.984, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9"}]}}, {"page_no": 9, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 123.76199999999994, "r_x1": 173.094, "r_y1": 123.76199999999994, "r_x2": 173.094, "r_y2": 115.83600000000001, "r_x3": 134.765, "r_y3": 115.83600000000001, "coord_origin": "TOPLEFT"}, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.303, "r_y0": 124.90999999999997, "r_x1": 480.592, "r_y1": 124.90999999999997, "r_x2": 480.592, "r_y2": 113.62099999999998, "r_x3": 181.303, "r_y3": 113.62099999999998, "coord_origin": "TOPLEFT"}, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 135.86900000000003, "r_x1": 480.594, "r_y1": 135.86900000000003, "r_x2": 480.594, "r_y2": 124.58000000000004, "r_x3": 134.765, "r_y3": 124.58000000000004, "coord_origin": "TOPLEFT"}, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 146.82799999999997, "r_x1": 305.957, "r_y1": 146.82799999999997, "r_x2": 305.957, "r_y2": 135.539, "r_x3": 134.765, "r_y3": 135.539, "coord_origin": "TOPLEFT"}, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.782, "r_y0": 175.57000000000005, "r_x1": 194.998, "r_y1": 175.57000000000005, "r_x2": 194.998, "r_y2": 164.28099999999995, "r_x3": 160.782, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.525, "r_y0": 175.54499999999996, "r_x1": 254.045, "r_y1": 175.54499999999996, "r_x2": 254.045, "r_y2": 164.25599999999997, "r_x3": 215.525, "r_y3": 164.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.397, "r_y0": 170.09000000000003, "r_x1": 323.991, "r_y1": 170.09000000000003, "r_x2": 323.991, "r_y2": 158.80100000000004, "r_x3": 300.397, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.345, "r_y0": 175.57000000000005, "r_x1": 414.747, "r_y1": 175.57000000000005, "r_x2": 414.747, "r_y2": 164.28099999999995, "r_x3": 370.345, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.737, "r_y0": 170.09000000000003, "r_x1": 463.108, "r_y1": 170.09000000000003, "r_x2": 463.108, "r_y2": 158.80100000000004, "r_x3": 426.737, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.114, "r_y0": 181.04899999999998, "r_x1": 466.727, "r_y1": 181.04899999999998, "r_x2": 466.727, "r_y2": 169.76, "r_x3": 423.114, "r_y3": 169.76, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.413, "r_y0": 183.04200000000003, "r_x1": 288.06, "r_y1": 183.04200000000003, "r_x2": 288.06, "r_y2": 171.75300000000004, "r_x3": 262.413, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.429, "r_y0": 183.04200000000003, "r_x1": 329.447, "r_y1": 183.04200000000003, "r_x2": 329.447, "r_y2": 171.75300000000004, "r_x3": 296.429, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.033, "r_y0": 183.04200000000003, "r_x1": 354.758, "r_y1": 183.04200000000003, "r_x2": 354.758, "r_y2": 171.75300000000004, "r_x3": 345.033, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.538, "r_y0": 201.87099999999998, "r_x1": 201.241, "r_y1": 201.87099999999998, "r_x2": 201.241, "r_y2": 190.582, "r_x3": 154.538, "r_y3": 190.582, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 196.39200000000005, "r_x1": 247.132, "r_y1": 196.39200000000005, "r_x2": 247.132, "r_y2": 185.10299999999995, "r_x3": 222.437, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 196.39200000000005, "r_x1": 285.731, "r_y1": 196.39200000000005, "r_x2": 285.731, "r_y2": 185.10299999999995, "r_x3": 264.744, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 196.39200000000005, "r_x1": 323.431, "r_y1": 196.39200000000005, "r_x2": 323.431, "r_y2": 185.10299999999995, "r_x3": 302.444, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 196.39200000000005, "r_x1": 360.39, "r_y1": 196.39200000000005, "r_x2": 360.39, "r_y2": 185.10299999999995, "r_x3": 339.403, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.116, "r_y0": 195.24400000000003, "r_x1": 401.973, "r_y1": 195.24400000000003, "r_x2": 401.973, "r_y2": 187.31799999999998, "r_x3": 383.116, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 195.24400000000003, "r_x1": 454.35, "r_y1": 195.24400000000003, "r_x2": 454.35, "r_y2": 187.31799999999998, "r_x3": 435.493, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 209.34299999999996, "r_x1": 248.667, "r_y1": 209.34299999999996, "r_x2": 248.667, "r_y2": 198.05399999999997, "r_x3": 220.903, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 209.34299999999996, "r_x1": 285.731, "r_y1": 209.34299999999996, "r_x2": 285.731, "r_y2": 198.05399999999997, "r_x3": 264.744, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 209.34299999999996, "r_x1": 323.431, "r_y1": 209.34299999999996, "r_x2": 323.431, "r_y2": 198.05399999999997, "r_x3": 302.444, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 209.34299999999996, "r_x1": 360.39, "r_y1": 209.34299999999996, "r_x2": 360.39, "r_y2": 198.05399999999997, "r_x3": 339.403, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 209.34299999999996, "r_x1": 403.039, "r_y1": 209.34299999999996, "r_x2": 403.039, "r_y2": 198.05399999999997, "r_x3": 382.052, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 209.34299999999996, "r_x1": 453.112, "r_y1": 209.34299999999996, "r_x2": 453.112, "r_y2": 198.05399999999997, "r_x3": 436.732, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.945, "r_y0": 228.173, "r_x1": 199.834, "r_y1": 228.173, "r_x2": 199.834, "r_y2": 216.88400000000001, "r_x3": 155.945, "r_y3": 216.88400000000001, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 222.69299999999998, "r_x1": 247.132, "r_y1": 222.69299999999998, "r_x2": 247.132, "r_y2": 211.404, "r_x3": 222.437, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 222.69299999999998, "r_x1": 285.731, "r_y1": 222.69299999999998, "r_x2": 285.731, "r_y2": 211.404, "r_x3": 264.744, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 222.69299999999998, "r_x1": 323.431, "r_y1": 222.69299999999998, "r_x2": 323.431, "r_y2": 211.404, "r_x3": 302.444, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 221.54499999999996, "r_x1": 361.976, "r_y1": 221.54499999999996, "r_x2": 361.976, "r_y2": 213.61900000000003, "r_x3": 337.815, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 221.54499999999996, "r_x1": 404.625, "r_y1": 221.54499999999996, "r_x2": 404.625, "r_y2": 213.61900000000003, "r_x3": 380.464, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 221.54499999999996, "r_x1": 454.35, "r_y1": 221.54499999999996, "r_x2": 454.35, "r_y2": 213.61900000000003, "r_x3": 435.493, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 235.64499999999998, "r_x1": 248.667, "r_y1": 235.64499999999998, "r_x2": 248.667, "r_y2": 224.356, "r_x3": 220.903, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 235.64499999999998, "r_x1": 285.731, "r_y1": 235.64499999999998, "r_x2": 285.731, "r_y2": 224.356, "r_x3": 264.744, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 235.64499999999998, "r_x1": 323.431, "r_y1": 235.64499999999998, "r_x2": 323.431, "r_y2": 224.356, "r_x3": 302.444, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.706, "r_y0": 235.64499999999998, "r_x1": 358.086, "r_y1": 235.64499999999998, "r_x2": 358.086, "r_y2": 224.356, "r_x3": 341.706, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 235.64499999999998, "r_x1": 403.039, "r_y1": 235.64499999999998, "r_x2": 403.039, "r_y2": 224.356, "r_x3": 382.052, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 235.64499999999998, "r_x1": 453.112, "r_y1": 235.64499999999998, "r_x2": 453.112, "r_y2": 224.356, "r_x3": 436.732, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.626, "r_y0": 254.47400000000005, "r_x1": 207.152, "r_y1": 254.47400000000005, "r_x2": 207.152, "r_y2": 243.18499999999995, "r_x3": 148.626, "r_y3": 243.18499999999995, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 248.99400000000003, "r_x1": 247.132, "r_y1": 248.99400000000003, "r_x2": 247.132, "r_y2": 237.70500000000004, "r_x3": 222.437, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 248.99400000000003, "r_x1": 285.731, "r_y1": 248.99400000000003, "r_x2": 285.731, "r_y2": 237.70500000000004, "r_x3": 264.744, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 248.99400000000003, "r_x1": 323.431, "r_y1": 248.99400000000003, "r_x2": 323.431, "r_y2": 237.70500000000004, "r_x3": 302.444, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 247.846, "r_x1": 361.976, "r_y1": 247.846, "r_x2": 361.976, "r_y2": 239.91999999999996, "r_x3": 337.815, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 247.846, "r_x1": 404.625, "r_y1": 247.846, "r_x2": 404.625, "r_y2": 239.91999999999996, "r_x3": 380.464, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 247.846, "r_x1": 454.35, "r_y1": 247.846, "r_x2": 454.35, "r_y2": 239.91999999999996, "r_x3": 435.493, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 261.946, "r_x1": 248.667, "r_y1": 261.946, "r_x2": 248.667, "r_y2": 250.65700000000004, "r_x3": 220.903, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 261.946, "r_x1": 285.731, "r_y1": 261.946, "r_x2": 285.731, "r_y2": 250.65700000000004, "r_x3": 264.744, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 261.946, "r_x1": 323.431, "r_y1": 261.946, "r_x2": 323.431, "r_y2": 250.65700000000004, "r_x3": 302.444, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 261.946, "r_x1": 360.39, "r_y1": 261.946, "r_x2": 360.39, "r_y2": 250.65700000000004, "r_x3": 339.403, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 261.946, "r_x1": 403.039, "r_y1": 261.946, "r_x2": 403.039, "r_y2": 250.65700000000004, "r_x3": 382.052, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 261.946, "r_x1": 453.112, "r_y1": 261.946, "r_x2": 453.112, "r_y2": 250.65700000000004, "r_x3": 436.732, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 297.722, "r_x1": 149.402, "r_y1": 297.722, "r_x2": 149.402, "r_y2": 288.915, "r_x3": 134.765, "r_y3": 288.915, "coord_origin": "TOPLEFT"}, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 297.722, "r_x1": 257.087, "r_y1": 297.722, "r_x2": 257.087, "r_y2": 288.915, "r_x3": 160.859, "r_y3": 288.915, "coord_origin": "TOPLEFT"}, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 318.658, "r_x1": 189.59, "r_y1": 318.658, "r_x2": 189.59, "r_y2": 309.861, "r_x3": 134.765, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "To illustrate", "orig": "To illustrate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.263, "r_y0": 318.658, "r_x1": 208.096, "r_y1": 318.658, "r_x2": 208.096, "r_y2": 309.861, "r_x3": 194.263, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.768, "r_y0": 318.658, "r_x1": 258.971, "r_y1": 318.658, "r_x2": 258.971, "r_y2": 309.861, "r_x3": 212.768, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "qualitative", "orig": "qualitative", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.643, "r_y0": 318.658, "r_x1": 308.822, "r_y1": 318.658, "r_x2": 308.822, "r_y2": 309.861, "r_x3": 263.643, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "differences", "orig": "differences", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.484, "r_y0": 318.658, "r_x1": 480.588, "r_y1": 318.658, "r_x2": 480.588, "r_y2": 309.861, "r_x3": 313.484, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "between OTSL and HTML, Figure 5", "orig": "between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 330.613, "r_x1": 480.589, "r_y1": 330.613, "r_x2": 480.589, "r_y2": 321.816, "r_x3": 134.765, "r_y3": 321.816, "coord_origin": "TOPLEFT"}, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 342.568, "r_x1": 480.587, "r_y1": 342.568, "r_x2": 480.587, "r_y2": 333.771, "r_x3": 134.765, "r_y3": 333.771, "coord_origin": "TOPLEFT"}, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 354.523, "r_x1": 480.59, "r_y1": 354.523, "r_x2": 480.59, "r_y2": 345.726, "r_x3": 134.765, "r_y3": 345.726, "coord_origin": "TOPLEFT"}, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 366.478, "r_x1": 161.657, "r_y1": 366.478, "r_x2": 161.657, "r_y2": 357.681, "r_x3": 134.765, "r_y3": 357.681, "coord_origin": "TOPLEFT"}, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 405.516, "r_x1": 162.644, "r_y1": 405.516, "r_x2": 162.644, "r_y2": 397.59, "r_x3": 134.765, "r_y3": 397.59, "coord_origin": "TOPLEFT"}, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.384, "r_y0": 406.664, "r_x1": 437.456, "r_y1": 406.664, "r_x2": 437.456, "r_y2": 395.375, "r_x3": 167.384, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "The OTSL model produces more accurate bounding boxes with", "orig": "The OTSL model produces more accurate bounding boxes with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.2, "r_y0": 406.664, "r_x1": 456.125, "r_y1": 406.664, "r_x2": 456.125, "r_y2": 395.375, "r_x3": 442.2, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "less", "orig": "less", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.86, "r_y0": 406.664, "r_x1": 480.591, "r_y1": 406.664, "r_x2": 480.591, "r_y2": 395.375, "r_x3": 460.86, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "over-", "orig": "over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 417.623, "r_x1": 147.049, "r_y1": 417.623, "r_x2": 147.049, "r_y2": 406.334, "r_x3": 134.765, "r_y3": 406.334, "coord_origin": "TOPLEFT"}, "text": "lap", "orig": "lap", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.434, "r_y0": 417.623, "r_x1": 480.591, "r_y1": 417.623, "r_x2": 480.591, "r_y2": 406.334, "r_x3": 151.434, "r_y3": 406.334, "coord_origin": "TOPLEFT"}, "text": "(E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "(E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 428.582, "r_x1": 146.541, "r_y1": 428.582, "r_x2": 146.541, "r_y2": 417.293, "r_x3": 134.765, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "ble", "orig": "ble", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.391, "r_y0": 428.582, "r_x1": 168.025, "r_y1": 428.582, "r_x2": 168.025, "r_y2": 417.293, "r_x3": 151.391, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "(A),", "orig": "(A),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.885, "r_y0": 428.582, "r_x1": 181.066, "r_y1": 428.582, "r_x2": 181.066, "r_y2": 417.293, "r_x3": 172.885, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "at", "orig": "at", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.925, "r_y0": 428.582, "r_x1": 206.655, "r_y1": 428.582, "r_x2": 206.655, "r_y2": 417.293, "r_x3": 185.925, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "twice", "orig": "twice", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.506, "r_y0": 428.582, "r_x1": 224.305, "r_y1": 428.582, "r_x2": 224.305, "r_y2": 417.293, "r_x3": 211.506, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.165, "r_y0": 428.582, "r_x1": 264.77, "r_y1": 428.582, "r_x2": 264.77, "r_y2": 417.293, "r_x3": 229.165, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "inference", "orig": "inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.621, "r_y0": 428.582, "r_x1": 291.939, "r_y1": 428.582, "r_x2": 291.939, "r_y2": 417.293, "r_x3": 269.621, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "speed", "orig": "speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.799, "r_y0": 428.582, "r_x1": 327.819, "r_y1": 428.582, "r_x2": 327.819, "r_y2": 417.293, "r_x3": 296.799, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "because", "orig": "because", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.67, "r_y0": 428.582, "r_x1": 340.092, "r_y1": 428.582, "r_x2": 340.092, "r_y2": 417.293, "r_x3": 332.67, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.952, "r_y0": 428.582, "r_x1": 373.2, "r_y1": 428.582, "r_x2": 373.2, "r_y2": 417.293, "r_x3": 344.952, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "shorter", "orig": "shorter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.05, "r_y0": 428.582, "r_x1": 413.174, "r_y1": 428.582, "r_x2": 413.174, "r_y2": 417.293, "r_x3": 378.05, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "sequence", "orig": "sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.024, "r_y0": 428.582, "r_x1": 443.108, "r_y1": 428.582, "r_x2": 443.108, "r_y2": 417.293, "r_x3": 418.024, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "length", "orig": "length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.959, "r_y0": 428.582, "r_x1": 480.588, "r_y1": 428.582, "r_x2": 480.588, "r_y2": 417.293, "r_x3": 447.959, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "(B),(C).", "orig": "(B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.541, "r_x1": 304.692, "r_y1": 439.541, "r_x2": 304.692, "r_y2": 428.252, "r_x3": 134.765, "r_y3": 428.252, "coord_origin": "TOPLEFT"}, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 518.934, "r_x1": 190.62, "r_y1": 518.934, "r_x2": 190.62, "r_y2": 516.296, "r_x3": 180.125, "r_y3": 516.296, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 522.8330000000001, "r_x1": 304.548, "r_y1": 522.8330000000001, "r_x2": 304.548, "r_y2": 520.194, "r_x3": 183.244, "r_y3": 520.194, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "orig": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 526.731, "r_x1": 388.423, "r_y1": 526.731, "r_x2": 388.423, "r_y2": 524.0930000000001, "r_x3": 183.244, "r_y3": 524.0930000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 530.63, "r_x1": 388.423, "r_y1": 530.63, "r_x2": 388.423, "r_y2": 527.992, "r_x3": 183.244, "r_y3": 527.992, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 534.529, "r_x1": 388.423, "r_y1": 534.529, "r_x2": 388.423, "r_y2": 531.8910000000001, "r_x3": 183.244, "r_y3": 531.8910000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 538.428, "r_x1": 388.423, "r_y1": 538.428, "r_x2": 388.423, "r_y2": 535.79, "r_x3": 183.244, "r_y3": 535.79, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 542.327, "r_x1": 388.423, "r_y1": 542.327, "r_x2": 388.423, "r_y2": 539.689, "r_x3": 183.244, "r_y3": 539.689, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 546.226, "r_x1": 388.423, "r_y1": 546.226, "r_x2": 388.423, "r_y2": 543.588, "r_x3": 183.244, "r_y3": 543.588, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 550.124, "r_x1": 388.423, "r_y1": 550.124, "r_x2": 388.423, "r_y2": 547.486, "r_x3": 183.244, "r_y3": 547.486, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 554.023, "r_x1": 388.423, "r_y1": 554.023, "r_x2": 388.423, "r_y2": 551.385, "r_x3": 183.244, "r_y3": 551.385, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 557.922, "r_x1": 191.868, "r_y1": 557.922, "r_x2": 191.868, "r_y2": 555.284, "r_x3": 180.125, "r_y3": 555.284, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 521.001, "r_x1": 450.486, "r_y1": 521.001, "r_x2": 450.486, "r_y2": 518.363, "r_x3": 407.383, "r_y3": 518.363, "coord_origin": "TOPLEFT"}, "text": "C C L L L C L L L L L C L L NL", "orig": "C C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 524.9, "r_x1": 450.486, "r_y1": 524.9, "r_x2": 450.486, "r_y2": 522.262, "r_x3": 407.383, "r_y3": 522.262, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 528.799, "r_x1": 450.486, "r_y1": 528.799, "r_x2": 450.486, "r_y2": 526.1600000000001, "r_x3": 407.383, "r_y3": 526.1600000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 532.697, "r_x1": 450.486, "r_y1": 532.697, "r_x2": 450.486, "r_y2": 530.059, "r_x3": 407.383, "r_y3": 530.059, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 536.596, "r_x1": 450.486, "r_y1": 536.596, "r_x2": 450.486, "r_y2": 533.9580000000001, "r_x3": 407.383, "r_y3": 533.9580000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 540.495, "r_x1": 450.486, "r_y1": 540.495, "r_x2": 450.486, "r_y2": 537.857, "r_x3": 407.383, "r_y3": 537.857, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 544.394, "r_x1": 450.486, "r_y1": 544.394, "r_x2": 450.486, "r_y2": 541.756, "r_x3": 407.383, "r_y3": 541.756, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 548.293, "r_x1": 450.486, "r_y1": 548.293, "r_x2": 450.486, "r_y2": 545.655, "r_x3": 407.383, "r_y3": 545.655, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 552.192, "r_x1": 450.486, "r_y1": 552.192, "r_x2": 450.486, "r_y2": 549.554, "r_x3": 407.383, "r_y3": 549.554, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.529, "r_y0": 515.288, "r_x1": 181.853, "r_y1": 515.288, "r_x2": 181.853, "r_y2": 509.533, "r_x3": 164.529, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.584, "r_y0": 515.288, "r_x1": 208.901, "r_y1": 515.288, "r_x2": 208.901, "r_y2": 509.533, "r_x3": 183.584, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 515.288, "r_x1": 221.04, "r_y1": 515.288, "r_x2": 221.04, "r_y2": 509.533, "r_x3": 210.633, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.202, "r_y0": 515.433, "r_x1": 406.836, "r_y1": 515.433, "r_x2": 406.836, "r_y2": 509.678, "r_x3": 390.202, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.569, "r_y0": 515.433, "r_x1": 433.886, "r_y1": 515.433, "r_x2": 433.886, "r_y2": 509.678, "r_x3": 408.569, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.617, "r_y0": 515.433, "r_x1": 446.025, "r_y1": 515.433, "r_x2": 446.025, "r_y2": 509.678, "r_x3": 435.617, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.193, "r_y0": 526.36, "r_x1": 172.823, "r_y1": 526.36, "r_x2": 172.823, "r_y2": 519.1659999999999, "r_x3": 167.193, "r_y3": 519.1659999999999, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.337, "r_y0": 455.912, "r_x1": 192.967, "r_y1": 455.912, "r_x2": 192.967, "r_y2": 448.718, "r_x3": 187.337, "r_y3": 448.718, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.387, "r_y0": 573.292, "r_x1": 173.016, "r_y1": 573.292, "r_x2": 173.016, "r_y2": 566.0989999999999, "r_x3": 167.387, "r_y3": 566.0989999999999, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.456, "r_y0": 629.067, "r_x1": 253.657, "r_y1": 629.067, "r_x2": 253.657, "r_y2": 621.874, "r_x3": 248.456, "r_y3": 621.874, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.901, "r_y0": 526.4870000000001, "r_x1": 401.531, "r_y1": 526.4870000000001, "r_x2": 401.531, "r_y2": 519.293, "r_x3": 395.901, "r_y3": 519.293, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.46, "r_y0": 597.268, "r_x1": 177.455, "r_y1": 580.287, "r_x2": 171.7, "r_y2": 580.289, "r_x3": 171.705, "r_y3": 597.269, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.891, "r_y0": 649.923, "r_x1": 256.886, "r_y1": 633.633, "r_x2": 251.131, "r_y2": 633.634, "r_x3": 251.136, "r_y3": 649.925, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 607.287, "r_x1": 427.038, "r_y1": 607.287, "r_x2": 427.038, "r_y2": 601.532, "r_x3": 372.146, "r_y3": 601.532, "coord_origin": "TOPLEFT"}, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 613.729, "r_x1": 430.068, "r_y1": 613.729, "r_x2": 430.068, "r_y2": 607.9739999999999, "r_x3": 372.146, "r_y3": 607.9739999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 648.702, "r_x1": 231.082, "r_y1": 648.702, "r_x2": 231.082, "r_y2": 642.947, "r_x3": 176.88, "r_y3": 642.947, "coord_origin": "TOPLEFT"}, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 655.144, "r_x1": 230.993, "r_y1": 655.144, "r_x2": 230.993, "r_y2": 649.389, "r_x3": 176.88, "r_y3": 649.389, "coord_origin": "TOPLEFT"}, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 661.586, "r_x1": 203.932, "r_y1": 661.586, "r_x2": 203.932, "r_y2": 655.831, "r_x3": 176.88, "r_y3": 655.831, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.932, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.563, "r_x3": 215.932, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.057, "r_y0": 569.16, "r_x1": 231.719, "r_y1": 569.16, "r_x2": 231.719, "r_y2": 557.563, "r_x3": 229.057, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 342.634, "r_y0": 439.717, "r_x1": 344.819, "r_y1": 439.717, "r_x2": 344.819, "r_y2": 430.197, "r_x3": 342.634, "r_y3": 430.197, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.209, "r_y0": 451.197, "r_x1": 263.57, "r_y1": 451.197, "r_x2": 263.57, "r_y2": 448.461, "r_x3": 261.209, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.335, "r_y0": 451.197, "r_x1": 313.636, "r_y1": 451.197, "r_x2": 313.636, "r_y2": 448.461, "r_x3": 312.335, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.411, "r_y0": 451.197, "r_x1": 380.057, "r_y1": 451.197, "r_x2": 380.057, "r_y2": 448.461, "r_x3": 377.411, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 456.076, "r_x1": 205.818, "r_y1": 456.076, "r_x2": 205.818, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.208, "r_y0": 456.076, "r_x1": 229.761, "r_y1": 456.076, "r_x2": 229.761, "r_y2": 453.34, "r_x3": 222.208, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.267, "r_y0": 456.076, "r_x1": 250.82, "r_y1": 456.076, "r_x2": 250.82, "r_y2": 453.34, "r_x3": 243.267, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.297, "r_y0": 456.076, "r_x1": 271.842, "r_y1": 456.076, "r_x2": 271.842, "r_y2": 453.34, "r_x3": 264.297, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.319, "r_y0": 456.076, "r_x1": 292.872, "r_y1": 456.076, "r_x2": 292.872, "r_y2": 453.34, "r_x3": 285.319, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.378, "r_y0": 456.076, "r_x1": 311.766, "r_y1": 456.076, "r_x2": 311.766, "r_y2": 453.34, "r_x3": 306.378, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.417, "r_y0": 456.076, "r_x1": 325.575, "r_y1": 456.076, "r_x2": 325.575, "r_y2": 453.34, "r_x3": 323.417, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.458, "r_y0": 456.076, "r_x1": 336.616, "r_y1": 456.076, "r_x2": 336.616, "r_y2": 453.34, "r_x3": 334.458, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.528, "r_y0": 456.076, "r_x1": 347.685, "r_y1": 456.076, "r_x2": 347.685, "r_y2": 453.34, "r_x3": 345.528, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.569, "r_y0": 456.076, "r_x1": 358.726, "r_y1": 456.076, "r_x2": 358.726, "r_y2": 453.34, "r_x3": 356.569, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.638, "r_y0": 456.076, "r_x1": 371.964, "r_y1": 456.076, "r_x2": 371.964, "r_y2": 453.34, "r_x3": 367.638, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.673, "r_y0": 456.076, "r_x1": 386.999, "r_y1": 456.076, "r_x2": 386.999, "r_y2": 453.34, "r_x3": 382.673, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.737, "r_y0": 456.076, "r_x1": 402.063, "r_y1": 456.076, "r_x2": 402.063, "r_y2": 453.34, "r_x3": 397.737, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 457.8, "r_x1": 414.935, "r_y1": 457.8, "r_x2": 414.935, "r_y2": 447.993, "r_x3": 412.789, "r_y3": 447.993, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.07, "r_y0": 456.076, "r_x1": 422.535, "r_y1": 456.076, "r_x2": 422.535, "r_y2": 453.34, "r_x3": 416.07, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "128", "orig": "128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.563, "r_y1": 466.66, "r_x2": 204.563, "r_y2": 463.924, "r_x3": 200.64, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.924, "r_x3": 367.626, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 466.66, "r_x1": 384.616, "r_y1": 466.66, "r_x2": 384.616, "r_y2": 463.924, "r_x3": 382.661, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 466.66, "r_x1": 399.679, "r_y1": 466.66, "r_x2": 399.679, "r_y2": 463.924, "r_x3": 397.725, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 471.539, "r_x1": 206.503, "r_y1": 471.539, "r_x2": 206.503, "r_y2": 468.803, "r_x3": 200.64, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 471.539, "r_x1": 266.245, "r_y1": 471.539, "r_x2": 266.245, "r_y2": 468.803, "r_x3": 264.29, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.372, "r_y0": 471.539, "r_x1": 308.326, "r_y1": 471.539, "r_x2": 308.326, "r_y2": 468.803, "r_x3": 306.372, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.515, "r_y0": 471.539, "r_x1": 347.47, "r_y1": 471.539, "r_x2": 347.47, "r_y2": 468.803, "r_x3": 345.515, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.556, "r_y0": 471.539, "r_x1": 358.511, "r_y1": 471.539, "r_x2": 358.511, "r_y2": 468.803, "r_x3": 356.556, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 471.539, "r_x1": 369.58, "r_y1": 471.539, "r_x2": 369.58, "r_y2": 468.803, "r_x3": 367.626, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 471.539, "r_x1": 384.615, "r_y1": 471.539, "r_x2": 384.615, "r_y2": 468.803, "r_x3": 382.661, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 476.418, "r_x1": 206.503, "r_y1": 476.418, "r_x2": 206.503, "r_y2": 473.682, "r_x3": 200.64, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 476.418, "r_x1": 266.245, "r_y1": 476.418, "r_x2": 266.245, "r_y2": 473.682, "r_x3": 264.29, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 481.268, "r_x1": 206.503, "r_y1": 481.268, "r_x2": 206.503, "r_y2": 478.532, "r_x3": 200.64, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.264, "r_y0": 481.268, "r_x1": 245.218, "r_y1": 481.268, "r_x2": 245.218, "r_y2": 478.532, "r_x3": 243.264, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 481.268, "r_x1": 266.245, "r_y1": 481.268, "r_x2": 266.245, "r_y2": 478.532, "r_x3": 264.29, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.405, "r_y0": 481.268, "r_x1": 325.359, "r_y1": 481.268, "r_x2": 325.359, "r_y2": 478.532, "r_x3": 323.405, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 481.268, "r_x1": 399.679, "r_y1": 481.268, "r_x2": 399.679, "r_y2": 478.532, "r_x3": 397.725, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 486.147, "r_x1": 206.503, "r_y1": 486.147, "r_x2": 206.503, "r_y2": 483.411, "r_x3": 200.64, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 486.147, "r_x1": 384.616, "r_y1": 486.147, "r_x2": 384.616, "r_y2": 483.411, "r_x3": 382.661, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 486.147, "r_x1": 401.648, "r_y1": 486.147, "r_x2": 401.648, "r_y2": 483.411, "r_x3": 397.725, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 486.147, "r_x1": 414.744, "r_y1": 486.147, "r_x2": 414.744, "r_y2": 483.411, "r_x3": 412.789, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 491.026, "r_x1": 207.134, "r_y1": 491.026, "r_x2": 207.134, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 491.026, "r_x1": 369.784, "r_y1": 491.026, "r_x2": 369.784, "r_y2": 488.29, "r_x3": 367.626, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 491.026, "r_x1": 384.819, "r_y1": 491.026, "r_x2": 384.819, "r_y2": 488.29, "r_x3": 382.661, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 491.026, "r_x1": 402.051, "r_y1": 491.026, "r_x2": 402.051, "r_y2": 488.29, "r_x3": 397.725, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 495.904, "r_x1": 208.472, "r_y1": 495.904, "r_x2": 208.472, "r_y2": 493.168, "r_x3": 200.64, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 495.904, "r_x1": 266.245, "r_y1": 495.904, "r_x2": 266.245, "r_y2": 493.168, "r_x3": 264.29, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.915, "r_y0": 675.346, "r_x1": 230.1, "r_y1": 675.346, "r_x2": 230.1, "r_y2": 665.826, "r_x3": 227.915, "r_y3": 665.826, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.581, "r_y0": 693.429, "r_x1": 302.726, "r_y1": 693.429, "r_x2": 302.726, "r_y2": 683.622, "r_x3": 300.581, "r_y3": 683.622, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 7, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 143.979, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8309906721115112, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "page_header", "bbox": {"l": 167.821, "t": 91.49300000000005, "r": 231.72, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8367075324058533, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "caption", "bbox": {"l": 134.765, "t": 113.62099999999998, "r": 480.594, "b": 146.82799999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9512290954589844, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 123.76199999999994, "r_x1": 173.094, "r_y1": 123.76199999999994, "r_x2": 173.094, "r_y2": 115.83600000000001, "r_x3": 134.765, "r_y3": 115.83600000000001, "coord_origin": "TOPLEFT"}, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.303, "r_y0": 124.90999999999997, "r_x1": 480.592, "r_y1": 124.90999999999997, "r_x2": 480.592, "r_y2": 113.62099999999998, "r_x3": 181.303, "r_y3": 113.62099999999998, "coord_origin": "TOPLEFT"}, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 135.86900000000003, "r_x1": 480.594, "r_y1": 135.86900000000003, "r_x2": 480.594, "r_y2": 124.58000000000004, "r_x3": 134.765, "r_y3": 124.58000000000004, "coord_origin": "TOPLEFT"}, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 146.82799999999997, "r_x1": 305.957, "r_y1": 146.82799999999997, "r_x2": 305.957, "r_y2": 135.539, "r_x3": 134.765, "r_y3": 135.539, "coord_origin": "TOPLEFT"}, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "table", "bbox": {"l": 143.6376495361328, "t": 156.3477020263672, "r": 470.8485412597656, "b": 263.2624816894531, "coord_origin": "TOPLEFT"}, "confidence": 0.9884640574455261, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.782, "r_y0": 175.57000000000005, "r_x1": 194.998, "r_y1": 175.57000000000005, "r_x2": 194.998, "r_y2": 164.28099999999995, "r_x3": 160.782, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.525, "r_y0": 175.54499999999996, "r_x1": 254.045, "r_y1": 175.54499999999996, "r_x2": 254.045, "r_y2": 164.25599999999997, "r_x3": 215.525, "r_y3": 164.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.397, "r_y0": 170.09000000000003, "r_x1": 323.991, "r_y1": 170.09000000000003, "r_x2": 323.991, "r_y2": 158.80100000000004, "r_x3": 300.397, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.345, "r_y0": 175.57000000000005, "r_x1": 414.747, "r_y1": 175.57000000000005, "r_x2": 414.747, "r_y2": 164.28099999999995, "r_x3": 370.345, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.737, "r_y0": 170.09000000000003, "r_x1": 463.108, "r_y1": 170.09000000000003, "r_x2": 463.108, "r_y2": 158.80100000000004, "r_x3": 426.737, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.114, "r_y0": 181.04899999999998, "r_x1": 466.727, "r_y1": 181.04899999999998, "r_x2": 466.727, "r_y2": 169.76, "r_x3": 423.114, "r_y3": 169.76, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.413, "r_y0": 183.04200000000003, "r_x1": 288.06, "r_y1": 183.04200000000003, "r_x2": 288.06, "r_y2": 171.75300000000004, "r_x3": 262.413, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.429, "r_y0": 183.04200000000003, "r_x1": 329.447, "r_y1": 183.04200000000003, "r_x2": 329.447, "r_y2": 171.75300000000004, "r_x3": 296.429, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.033, "r_y0": 183.04200000000003, "r_x1": 354.758, "r_y1": 183.04200000000003, "r_x2": 354.758, "r_y2": 171.75300000000004, "r_x3": 345.033, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.538, "r_y0": 201.87099999999998, "r_x1": 201.241, "r_y1": 201.87099999999998, "r_x2": 201.241, "r_y2": 190.582, "r_x3": 154.538, "r_y3": 190.582, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 196.39200000000005, "r_x1": 247.132, "r_y1": 196.39200000000005, "r_x2": 247.132, "r_y2": 185.10299999999995, "r_x3": 222.437, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 196.39200000000005, "r_x1": 285.731, "r_y1": 196.39200000000005, "r_x2": 285.731, "r_y2": 185.10299999999995, "r_x3": 264.744, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 196.39200000000005, "r_x1": 323.431, "r_y1": 196.39200000000005, "r_x2": 323.431, "r_y2": 185.10299999999995, "r_x3": 302.444, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 196.39200000000005, "r_x1": 360.39, "r_y1": 196.39200000000005, "r_x2": 360.39, "r_y2": 185.10299999999995, "r_x3": 339.403, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.116, "r_y0": 195.24400000000003, "r_x1": 401.973, "r_y1": 195.24400000000003, "r_x2": 401.973, "r_y2": 187.31799999999998, "r_x3": 383.116, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 195.24400000000003, "r_x1": 454.35, "r_y1": 195.24400000000003, "r_x2": 454.35, "r_y2": 187.31799999999998, "r_x3": 435.493, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 209.34299999999996, "r_x1": 248.667, "r_y1": 209.34299999999996, "r_x2": 248.667, "r_y2": 198.05399999999997, "r_x3": 220.903, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 209.34299999999996, "r_x1": 285.731, "r_y1": 209.34299999999996, "r_x2": 285.731, "r_y2": 198.05399999999997, "r_x3": 264.744, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 209.34299999999996, "r_x1": 323.431, "r_y1": 209.34299999999996, "r_x2": 323.431, "r_y2": 198.05399999999997, "r_x3": 302.444, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 209.34299999999996, "r_x1": 360.39, "r_y1": 209.34299999999996, "r_x2": 360.39, "r_y2": 198.05399999999997, "r_x3": 339.403, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 209.34299999999996, "r_x1": 403.039, "r_y1": 209.34299999999996, "r_x2": 403.039, "r_y2": 198.05399999999997, "r_x3": 382.052, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 209.34299999999996, "r_x1": 453.112, "r_y1": 209.34299999999996, "r_x2": 453.112, "r_y2": 198.05399999999997, "r_x3": 436.732, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.945, "r_y0": 228.173, "r_x1": 199.834, "r_y1": 228.173, "r_x2": 199.834, "r_y2": 216.88400000000001, "r_x3": 155.945, "r_y3": 216.88400000000001, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 222.69299999999998, "r_x1": 247.132, "r_y1": 222.69299999999998, "r_x2": 247.132, "r_y2": 211.404, "r_x3": 222.437, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 222.69299999999998, "r_x1": 285.731, "r_y1": 222.69299999999998, "r_x2": 285.731, "r_y2": 211.404, "r_x3": 264.744, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 222.69299999999998, "r_x1": 323.431, "r_y1": 222.69299999999998, "r_x2": 323.431, "r_y2": 211.404, "r_x3": 302.444, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 221.54499999999996, "r_x1": 361.976, "r_y1": 221.54499999999996, "r_x2": 361.976, "r_y2": 213.61900000000003, "r_x3": 337.815, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 221.54499999999996, "r_x1": 404.625, "r_y1": 221.54499999999996, "r_x2": 404.625, "r_y2": 213.61900000000003, "r_x3": 380.464, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 221.54499999999996, "r_x1": 454.35, "r_y1": 221.54499999999996, "r_x2": 454.35, "r_y2": 213.61900000000003, "r_x3": 435.493, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 235.64499999999998, "r_x1": 248.667, "r_y1": 235.64499999999998, "r_x2": 248.667, "r_y2": 224.356, "r_x3": 220.903, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 235.64499999999998, "r_x1": 285.731, "r_y1": 235.64499999999998, "r_x2": 285.731, "r_y2": 224.356, "r_x3": 264.744, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 235.64499999999998, "r_x1": 323.431, "r_y1": 235.64499999999998, "r_x2": 323.431, "r_y2": 224.356, "r_x3": 302.444, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.706, "r_y0": 235.64499999999998, "r_x1": 358.086, "r_y1": 235.64499999999998, "r_x2": 358.086, "r_y2": 224.356, "r_x3": 341.706, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 235.64499999999998, "r_x1": 403.039, "r_y1": 235.64499999999998, "r_x2": 403.039, "r_y2": 224.356, "r_x3": 382.052, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 235.64499999999998, "r_x1": 453.112, "r_y1": 235.64499999999998, "r_x2": 453.112, "r_y2": 224.356, "r_x3": 436.732, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.626, "r_y0": 254.47400000000005, "r_x1": 207.152, "r_y1": 254.47400000000005, "r_x2": 207.152, "r_y2": 243.18499999999995, "r_x3": 148.626, "r_y3": 243.18499999999995, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 248.99400000000003, "r_x1": 247.132, "r_y1": 248.99400000000003, "r_x2": 247.132, "r_y2": 237.70500000000004, "r_x3": 222.437, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 248.99400000000003, "r_x1": 285.731, "r_y1": 248.99400000000003, "r_x2": 285.731, "r_y2": 237.70500000000004, "r_x3": 264.744, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 248.99400000000003, "r_x1": 323.431, "r_y1": 248.99400000000003, "r_x2": 323.431, "r_y2": 237.70500000000004, "r_x3": 302.444, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 247.846, "r_x1": 361.976, "r_y1": 247.846, "r_x2": 361.976, "r_y2": 239.91999999999996, "r_x3": 337.815, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 247.846, "r_x1": 404.625, "r_y1": 247.846, "r_x2": 404.625, "r_y2": 239.91999999999996, "r_x3": 380.464, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 247.846, "r_x1": 454.35, "r_y1": 247.846, "r_x2": 454.35, "r_y2": 239.91999999999996, "r_x3": 435.493, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 261.946, "r_x1": 248.667, "r_y1": 261.946, "r_x2": 248.667, "r_y2": 250.65700000000004, "r_x3": 220.903, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 261.946, "r_x1": 285.731, "r_y1": 261.946, "r_x2": 285.731, "r_y2": 250.65700000000004, "r_x3": 264.744, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 261.946, "r_x1": 323.431, "r_y1": 261.946, "r_x2": 323.431, "r_y2": 250.65700000000004, "r_x3": 302.444, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 261.946, "r_x1": 360.39, "r_y1": 261.946, "r_x2": 360.39, "r_y2": 250.65700000000004, "r_x3": 339.403, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 261.946, "r_x1": 403.039, "r_y1": 261.946, "r_x2": 403.039, "r_y2": 250.65700000000004, "r_x3": 382.052, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 261.946, "r_x1": 453.112, "r_y1": 261.946, "r_x2": 453.112, "r_y2": 250.65700000000004, "r_x3": 436.732, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 10, "label": "text", "bbox": {"l": 160.782, "t": 164.28099999999995, "r": 194.998, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.782, "r_y0": 175.57000000000005, "r_x1": 194.998, "r_y1": 175.57000000000005, "r_x2": 194.998, "r_y2": 164.28099999999995, "r_x3": 160.782, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 215.525, "t": 164.25599999999997, "r": 254.045, "b": 175.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.525, "r_y0": 175.54499999999996, "r_x1": 254.045, "r_y1": 175.54499999999996, "r_x2": 254.045, "r_y2": 164.25599999999997, "r_x3": 215.525, "r_y3": 164.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 300.397, "t": 158.80100000000004, "r": 323.991, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.397, "r_y0": 170.09000000000003, "r_x1": 323.991, "r_y1": 170.09000000000003, "r_x2": 323.991, "r_y2": 158.80100000000004, "r_x3": 300.397, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 370.345, "t": 164.28099999999995, "r": 414.747, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.345, "r_y0": 175.57000000000005, "r_x1": 414.747, "r_y1": 175.57000000000005, "r_x2": 414.747, "r_y2": 164.28099999999995, "r_x3": 370.345, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 426.737, "t": 158.80100000000004, "r": 463.108, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.737, "r_y0": 170.09000000000003, "r_x1": 463.108, "r_y1": 170.09000000000003, "r_x2": 463.108, "r_y2": 158.80100000000004, "r_x3": 426.737, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 423.114, "t": 169.76, "r": 466.727, "b": 181.04899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.114, "r_y0": 181.04899999999998, "r_x1": 466.727, "r_y1": 181.04899999999998, "r_x2": 466.727, "r_y2": 169.76, "r_x3": 423.114, "r_y3": 169.76, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 262.413, "t": 171.75300000000004, "r": 288.06, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.413, "r_y0": 183.04200000000003, "r_x1": 288.06, "r_y1": 183.04200000000003, "r_x2": 288.06, "r_y2": 171.75300000000004, "r_x3": 262.413, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 296.429, "t": 171.75300000000004, "r": 329.447, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.429, "r_y0": 183.04200000000003, "r_x1": 329.447, "r_y1": 183.04200000000003, "r_x2": 329.447, "r_y2": 171.75300000000004, "r_x3": 296.429, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 345.033, "t": 171.75300000000004, "r": 354.758, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.033, "r_y0": 183.04200000000003, "r_x1": 354.758, "r_y1": 183.04200000000003, "r_x2": 354.758, "r_y2": 171.75300000000004, "r_x3": 345.033, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 154.538, "t": 190.582, "r": 201.241, "b": 201.87099999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.538, "r_y0": 201.87099999999998, "r_x1": 201.241, "r_y1": 201.87099999999998, "r_x2": 201.241, "r_y2": 190.582, "r_x3": 154.538, "r_y3": 190.582, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 222.437, "t": 185.10299999999995, "r": 247.132, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 196.39200000000005, "r_x1": 247.132, "r_y1": 196.39200000000005, "r_x2": 247.132, "r_y2": 185.10299999999995, "r_x3": 222.437, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 264.744, "t": 185.10299999999995, "r": 285.731, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 196.39200000000005, "r_x1": 285.731, "r_y1": 196.39200000000005, "r_x2": 285.731, "r_y2": 185.10299999999995, "r_x3": 264.744, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 302.444, "t": 185.10299999999995, "r": 323.431, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 196.39200000000005, "r_x1": 323.431, "r_y1": 196.39200000000005, "r_x2": 323.431, "r_y2": 185.10299999999995, "r_x3": 302.444, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 339.403, "t": 185.10299999999995, "r": 360.39, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 196.39200000000005, "r_x1": 360.39, "r_y1": 196.39200000000005, "r_x2": 360.39, "r_y2": 185.10299999999995, "r_x3": 339.403, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 383.116, "t": 187.31799999999998, "r": 401.973, "b": 195.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.116, "r_y0": 195.24400000000003, "r_x1": 401.973, "r_y1": 195.24400000000003, "r_x2": 401.973, "r_y2": 187.31799999999998, "r_x3": 383.116, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 435.493, "t": 187.31799999999998, "r": 454.35, "b": 195.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 195.24400000000003, "r_x1": 454.35, "r_y1": 195.24400000000003, "r_x2": 454.35, "r_y2": 187.31799999999998, "r_x3": 435.493, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 220.903, "t": 198.05399999999997, "r": 248.667, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 209.34299999999996, "r_x1": 248.667, "r_y1": 209.34299999999996, "r_x2": 248.667, "r_y2": 198.05399999999997, "r_x3": 220.903, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 264.744, "t": 198.05399999999997, "r": 285.731, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 209.34299999999996, "r_x1": 285.731, "r_y1": 209.34299999999996, "r_x2": 285.731, "r_y2": 198.05399999999997, "r_x3": 264.744, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 302.444, "t": 198.05399999999997, "r": 323.431, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 209.34299999999996, "r_x1": 323.431, "r_y1": 209.34299999999996, "r_x2": 323.431, "r_y2": 198.05399999999997, "r_x3": 302.444, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 339.403, "t": 198.05399999999997, "r": 360.39, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 209.34299999999996, "r_x1": 360.39, "r_y1": 209.34299999999996, "r_x2": 360.39, "r_y2": 198.05399999999997, "r_x3": 339.403, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 382.052, "t": 198.05399999999997, "r": 403.039, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 209.34299999999996, "r_x1": 403.039, "r_y1": 209.34299999999996, "r_x2": 403.039, "r_y2": 198.05399999999997, "r_x3": 382.052, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 436.732, "t": 198.05399999999997, "r": 453.112, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 209.34299999999996, "r_x1": 453.112, "r_y1": 209.34299999999996, "r_x2": 453.112, "r_y2": 198.05399999999997, "r_x3": 436.732, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 155.945, "t": 216.88400000000001, "r": 199.834, "b": 228.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.945, "r_y0": 228.173, "r_x1": 199.834, "r_y1": 228.173, "r_x2": 199.834, "r_y2": 216.88400000000001, "r_x3": 155.945, "r_y3": 216.88400000000001, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 222.437, "t": 211.404, "r": 247.132, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 222.69299999999998, "r_x1": 247.132, "r_y1": 222.69299999999998, "r_x2": 247.132, "r_y2": 211.404, "r_x3": 222.437, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 264.744, "t": 211.404, "r": 285.731, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 222.69299999999998, "r_x1": 285.731, "r_y1": 222.69299999999998, "r_x2": 285.731, "r_y2": 211.404, "r_x3": 264.744, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 302.444, "t": 211.404, "r": 323.431, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 222.69299999999998, "r_x1": 323.431, "r_y1": 222.69299999999998, "r_x2": 323.431, "r_y2": 211.404, "r_x3": 302.444, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 337.815, "t": 213.61900000000003, "r": 361.976, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 221.54499999999996, "r_x1": 361.976, "r_y1": 221.54499999999996, "r_x2": 361.976, "r_y2": 213.61900000000003, "r_x3": 337.815, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 380.464, "t": 213.61900000000003, "r": 404.625, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 221.54499999999996, "r_x1": 404.625, "r_y1": 221.54499999999996, "r_x2": 404.625, "r_y2": 213.61900000000003, "r_x3": 380.464, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 435.493, "t": 213.61900000000003, "r": 454.35, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 221.54499999999996, "r_x1": 454.35, "r_y1": 221.54499999999996, "r_x2": 454.35, "r_y2": 213.61900000000003, "r_x3": 435.493, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 220.903, "t": 224.356, "r": 248.667, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 235.64499999999998, "r_x1": 248.667, "r_y1": 235.64499999999998, "r_x2": 248.667, "r_y2": 224.356, "r_x3": 220.903, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 264.744, "t": 224.356, "r": 285.731, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 235.64499999999998, "r_x1": 285.731, "r_y1": 235.64499999999998, "r_x2": 285.731, "r_y2": 224.356, "r_x3": 264.744, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 302.444, "t": 224.356, "r": 323.431, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 235.64499999999998, "r_x1": 323.431, "r_y1": 235.64499999999998, "r_x2": 323.431, "r_y2": 224.356, "r_x3": 302.444, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 341.706, "t": 224.356, "r": 358.086, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.706, "r_y0": 235.64499999999998, "r_x1": 358.086, "r_y1": 235.64499999999998, "r_x2": 358.086, "r_y2": 224.356, "r_x3": 341.706, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 382.052, "t": 224.356, "r": 403.039, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 235.64499999999998, "r_x1": 403.039, "r_y1": 235.64499999999998, "r_x2": 403.039, "r_y2": 224.356, "r_x3": 382.052, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 436.732, "t": 224.356, "r": 453.112, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 235.64499999999998, "r_x1": 453.112, "r_y1": 235.64499999999998, "r_x2": 453.112, "r_y2": 224.356, "r_x3": 436.732, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 148.626, "t": 243.18499999999995, "r": 207.152, "b": 254.47400000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.626, "r_y0": 254.47400000000005, "r_x1": 207.152, "r_y1": 254.47400000000005, "r_x2": 207.152, "r_y2": 243.18499999999995, "r_x3": 148.626, "r_y3": 243.18499999999995, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 222.437, "t": 237.70500000000004, "r": 247.132, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 248.99400000000003, "r_x1": 247.132, "r_y1": 248.99400000000003, "r_x2": 247.132, "r_y2": 237.70500000000004, "r_x3": 222.437, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 264.744, "t": 237.70500000000004, "r": 285.731, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 248.99400000000003, "r_x1": 285.731, "r_y1": 248.99400000000003, "r_x2": 285.731, "r_y2": 237.70500000000004, "r_x3": 264.744, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 302.444, "t": 237.70500000000004, "r": 323.431, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 248.99400000000003, "r_x1": 323.431, "r_y1": 248.99400000000003, "r_x2": 323.431, "r_y2": 237.70500000000004, "r_x3": 302.444, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 337.815, "t": 239.91999999999996, "r": 361.976, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 247.846, "r_x1": 361.976, "r_y1": 247.846, "r_x2": 361.976, "r_y2": 239.91999999999996, "r_x3": 337.815, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 380.464, "t": 239.91999999999996, "r": 404.625, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 247.846, "r_x1": 404.625, "r_y1": 247.846, "r_x2": 404.625, "r_y2": 239.91999999999996, "r_x3": 380.464, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 435.493, "t": 239.91999999999996, "r": 454.35, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 247.846, "r_x1": 454.35, "r_y1": 247.846, "r_x2": 454.35, "r_y2": 239.91999999999996, "r_x3": 435.493, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 220.903, "t": 250.65700000000004, "r": 248.667, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 261.946, "r_x1": 248.667, "r_y1": 261.946, "r_x2": 248.667, "r_y2": 250.65700000000004, "r_x3": 220.903, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 264.744, "t": 250.65700000000004, "r": 285.731, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 261.946, "r_x1": 285.731, "r_y1": 261.946, "r_x2": 285.731, "r_y2": 250.65700000000004, "r_x3": 264.744, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 302.444, "t": 250.65700000000004, "r": 323.431, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 261.946, "r_x1": 323.431, "r_y1": 261.946, "r_x2": 323.431, "r_y2": 250.65700000000004, "r_x3": 302.444, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 339.403, "t": 250.65700000000004, "r": 360.39, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 261.946, "r_x1": 360.39, "r_y1": 261.946, "r_x2": 360.39, "r_y2": 250.65700000000004, "r_x3": 339.403, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 382.052, "t": 250.65700000000004, "r": 403.039, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 261.946, "r_x1": 403.039, "r_y1": 261.946, "r_x2": 403.039, "r_y2": 250.65700000000004, "r_x3": 382.052, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 436.732, "t": 250.65700000000004, "r": 453.112, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 261.946, "r_x1": 453.112, "r_y1": 261.946, "r_x2": 453.112, "r_y2": 250.65700000000004, "r_x3": 436.732, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 288.915, "r": 257.087, "b": 297.722, "coord_origin": "TOPLEFT"}, "confidence": 0.9546447992324829, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 297.722, "r_x1": 149.402, "r_y1": 297.722, "r_x2": 149.402, "r_y2": 288.915, "r_x3": 134.765, "r_y3": 288.915, "coord_origin": "TOPLEFT"}, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 297.722, "r_x1": 257.087, "r_y1": 297.722, "r_x2": 257.087, "r_y2": 288.915, "r_x3": 160.859, "r_y3": 288.915, "coord_origin": "TOPLEFT"}, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 309.861, "r": 480.59, "b": 366.478, "coord_origin": "TOPLEFT"}, "confidence": 0.9834085702896118, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 318.658, "r_x1": 189.59, "r_y1": 318.658, "r_x2": 189.59, "r_y2": 309.861, "r_x3": 134.765, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "To illustrate", "orig": "To illustrate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.263, "r_y0": 318.658, "r_x1": 208.096, "r_y1": 318.658, "r_x2": 208.096, "r_y2": 309.861, "r_x3": 194.263, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.768, "r_y0": 318.658, "r_x1": 258.971, "r_y1": 318.658, "r_x2": 258.971, "r_y2": 309.861, "r_x3": 212.768, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "qualitative", "orig": "qualitative", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.643, "r_y0": 318.658, "r_x1": 308.822, "r_y1": 318.658, "r_x2": 308.822, "r_y2": 309.861, "r_x3": 263.643, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "differences", "orig": "differences", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.484, "r_y0": 318.658, "r_x1": 480.588, "r_y1": 318.658, "r_x2": 480.588, "r_y2": 309.861, "r_x3": 313.484, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "between OTSL and HTML, Figure 5", "orig": "between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 330.613, "r_x1": 480.589, "r_y1": 330.613, "r_x2": 480.589, "r_y2": 321.816, "r_x3": 134.765, "r_y3": 321.816, "coord_origin": "TOPLEFT"}, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 342.568, "r_x1": 480.587, "r_y1": 342.568, "r_x2": 480.587, "r_y2": 333.771, "r_x3": 134.765, "r_y3": 333.771, "coord_origin": "TOPLEFT"}, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 354.523, "r_x1": 480.59, "r_y1": 354.523, "r_x2": 480.59, "r_y2": 345.726, "r_x3": 134.765, "r_y3": 345.726, "coord_origin": "TOPLEFT"}, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 366.478, "r_x1": 161.657, "r_y1": 366.478, "r_x2": 161.657, "r_y2": 357.681, "r_x3": 134.765, "r_y3": 357.681, "coord_origin": "TOPLEFT"}, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "caption", "bbox": {"l": 134.765, "t": 395.375, "r": 480.591, "b": 439.717, "coord_origin": "TOPLEFT"}, "confidence": 0.9482728838920593, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 405.516, "r_x1": 162.644, "r_y1": 405.516, "r_x2": 162.644, "r_y2": 397.59, "r_x3": 134.765, "r_y3": 397.59, "coord_origin": "TOPLEFT"}, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.384, "r_y0": 406.664, "r_x1": 437.456, "r_y1": 406.664, "r_x2": 437.456, "r_y2": 395.375, "r_x3": 167.384, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "The OTSL model produces more accurate bounding boxes with", "orig": "The OTSL model produces more accurate bounding boxes with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.2, "r_y0": 406.664, "r_x1": 456.125, "r_y1": 406.664, "r_x2": 456.125, "r_y2": 395.375, "r_x3": 442.2, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "less", "orig": "less", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.86, "r_y0": 406.664, "r_x1": 480.591, "r_y1": 406.664, "r_x2": 480.591, "r_y2": 395.375, "r_x3": 460.86, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "over-", "orig": "over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 417.623, "r_x1": 147.049, "r_y1": 417.623, "r_x2": 147.049, "r_y2": 406.334, "r_x3": 134.765, "r_y3": 406.334, "coord_origin": "TOPLEFT"}, "text": "lap", "orig": "lap", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.434, "r_y0": 417.623, "r_x1": 480.591, "r_y1": 417.623, "r_x2": 480.591, "r_y2": 406.334, "r_x3": 151.434, "r_y3": 406.334, "coord_origin": "TOPLEFT"}, "text": "(E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "(E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 428.582, "r_x1": 146.541, "r_y1": 428.582, "r_x2": 146.541, "r_y2": 417.293, "r_x3": 134.765, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "ble", "orig": "ble", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.391, "r_y0": 428.582, "r_x1": 168.025, "r_y1": 428.582, "r_x2": 168.025, "r_y2": 417.293, "r_x3": 151.391, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "(A),", "orig": "(A),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.885, "r_y0": 428.582, "r_x1": 181.066, "r_y1": 428.582, "r_x2": 181.066, "r_y2": 417.293, "r_x3": 172.885, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "at", "orig": "at", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.925, "r_y0": 428.582, "r_x1": 206.655, "r_y1": 428.582, "r_x2": 206.655, "r_y2": 417.293, "r_x3": 185.925, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "twice", "orig": "twice", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.506, "r_y0": 428.582, "r_x1": 224.305, "r_y1": 428.582, "r_x2": 224.305, "r_y2": 417.293, "r_x3": 211.506, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.165, "r_y0": 428.582, "r_x1": 264.77, "r_y1": 428.582, "r_x2": 264.77, "r_y2": 417.293, "r_x3": 229.165, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "inference", "orig": "inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.621, "r_y0": 428.582, "r_x1": 291.939, "r_y1": 428.582, "r_x2": 291.939, "r_y2": 417.293, "r_x3": 269.621, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "speed", "orig": "speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.799, "r_y0": 428.582, "r_x1": 327.819, "r_y1": 428.582, "r_x2": 327.819, "r_y2": 417.293, "r_x3": 296.799, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "because", "orig": "because", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.67, "r_y0": 428.582, "r_x1": 340.092, "r_y1": 428.582, "r_x2": 340.092, "r_y2": 417.293, "r_x3": 332.67, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.952, "r_y0": 428.582, "r_x1": 373.2, "r_y1": 428.582, "r_x2": 373.2, "r_y2": 417.293, "r_x3": 344.952, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "shorter", "orig": "shorter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.05, "r_y0": 428.582, "r_x1": 413.174, "r_y1": 428.582, "r_x2": 413.174, "r_y2": 417.293, "r_x3": 378.05, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "sequence", "orig": "sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.024, "r_y0": 428.582, "r_x1": 443.108, "r_y1": 428.582, "r_x2": 443.108, "r_y2": 417.293, "r_x3": 418.024, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "length", "orig": "length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.959, "r_y0": 428.582, "r_x1": 480.588, "r_y1": 428.582, "r_x2": 480.588, "r_y2": 417.293, "r_x3": 447.959, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "(B),(C).", "orig": "(B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.541, "r_x1": 304.692, "r_y1": 439.541, "r_x2": 304.692, "r_y2": 428.252, "r_x3": 134.765, "r_y3": 428.252, "coord_origin": "TOPLEFT"}, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 342.634, "r_y0": 439.717, "r_x1": 344.819, "r_y1": 439.717, "r_x2": 344.819, "r_y2": 430.197, "r_x3": 342.634, "r_y3": 430.197, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "picture", "bbox": {"l": 162.67430114746094, "t": 444.62255859375, "r": 451.70062255859375, "b": 663.2135620117188, "coord_origin": "TOPLEFT"}, "confidence": 0.9742383360862732, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 518.934, "r_x1": 190.62, "r_y1": 518.934, "r_x2": 190.62, "r_y2": 516.296, "r_x3": 180.125, "r_y3": 516.296, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 522.8330000000001, "r_x1": 304.548, "r_y1": 522.8330000000001, "r_x2": 304.548, "r_y2": 520.194, "r_x3": 183.244, "r_y3": 520.194, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "orig": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 526.731, "r_x1": 388.423, "r_y1": 526.731, "r_x2": 388.423, "r_y2": 524.0930000000001, "r_x3": 183.244, "r_y3": 524.0930000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 530.63, "r_x1": 388.423, "r_y1": 530.63, "r_x2": 388.423, "r_y2": 527.992, "r_x3": 183.244, "r_y3": 527.992, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 534.529, "r_x1": 388.423, "r_y1": 534.529, "r_x2": 388.423, "r_y2": 531.8910000000001, "r_x3": 183.244, "r_y3": 531.8910000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 538.428, "r_x1": 388.423, "r_y1": 538.428, "r_x2": 388.423, "r_y2": 535.79, "r_x3": 183.244, "r_y3": 535.79, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 542.327, "r_x1": 388.423, "r_y1": 542.327, "r_x2": 388.423, "r_y2": 539.689, "r_x3": 183.244, "r_y3": 539.689, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 546.226, "r_x1": 388.423, "r_y1": 546.226, "r_x2": 388.423, "r_y2": 543.588, "r_x3": 183.244, "r_y3": 543.588, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 550.124, "r_x1": 388.423, "r_y1": 550.124, "r_x2": 388.423, "r_y2": 547.486, "r_x3": 183.244, "r_y3": 547.486, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 554.023, "r_x1": 388.423, "r_y1": 554.023, "r_x2": 388.423, "r_y2": 551.385, "r_x3": 183.244, "r_y3": 551.385, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 557.922, "r_x1": 191.868, "r_y1": 557.922, "r_x2": 191.868, "r_y2": 555.284, "r_x3": 180.125, "r_y3": 555.284, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 521.001, "r_x1": 450.486, "r_y1": 521.001, "r_x2": 450.486, "r_y2": 518.363, "r_x3": 407.383, "r_y3": 518.363, "coord_origin": "TOPLEFT"}, "text": "C C L L L C L L L L L C L L NL", "orig": "C C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 524.9, "r_x1": 450.486, "r_y1": 524.9, "r_x2": 450.486, "r_y2": 522.262, "r_x3": 407.383, "r_y3": 522.262, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 528.799, "r_x1": 450.486, "r_y1": 528.799, "r_x2": 450.486, "r_y2": 526.1600000000001, "r_x3": 407.383, "r_y3": 526.1600000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 532.697, "r_x1": 450.486, "r_y1": 532.697, "r_x2": 450.486, "r_y2": 530.059, "r_x3": 407.383, "r_y3": 530.059, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 536.596, "r_x1": 450.486, "r_y1": 536.596, "r_x2": 450.486, "r_y2": 533.9580000000001, "r_x3": 407.383, "r_y3": 533.9580000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 540.495, "r_x1": 450.486, "r_y1": 540.495, "r_x2": 450.486, "r_y2": 537.857, "r_x3": 407.383, "r_y3": 537.857, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 544.394, "r_x1": 450.486, "r_y1": 544.394, "r_x2": 450.486, "r_y2": 541.756, "r_x3": 407.383, "r_y3": 541.756, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 548.293, "r_x1": 450.486, "r_y1": 548.293, "r_x2": 450.486, "r_y2": 545.655, "r_x3": 407.383, "r_y3": 545.655, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 552.192, "r_x1": 450.486, "r_y1": 552.192, "r_x2": 450.486, "r_y2": 549.554, "r_x3": 407.383, "r_y3": 549.554, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.529, "r_y0": 515.288, "r_x1": 181.853, "r_y1": 515.288, "r_x2": 181.853, "r_y2": 509.533, "r_x3": 164.529, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.584, "r_y0": 515.288, "r_x1": 208.901, "r_y1": 515.288, "r_x2": 208.901, "r_y2": 509.533, "r_x3": 183.584, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 515.288, "r_x1": 221.04, "r_y1": 515.288, "r_x2": 221.04, "r_y2": 509.533, "r_x3": 210.633, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.202, "r_y0": 515.433, "r_x1": 406.836, "r_y1": 515.433, "r_x2": 406.836, "r_y2": 509.678, "r_x3": 390.202, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.569, "r_y0": 515.433, "r_x1": 433.886, "r_y1": 515.433, "r_x2": 433.886, "r_y2": 509.678, "r_x3": 408.569, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.617, "r_y0": 515.433, "r_x1": 446.025, "r_y1": 515.433, "r_x2": 446.025, "r_y2": 509.678, "r_x3": 435.617, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.193, "r_y0": 526.36, "r_x1": 172.823, "r_y1": 526.36, "r_x2": 172.823, "r_y2": 519.1659999999999, "r_x3": 167.193, "r_y3": 519.1659999999999, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.337, "r_y0": 455.912, "r_x1": 192.967, "r_y1": 455.912, "r_x2": 192.967, "r_y2": 448.718, "r_x3": 187.337, "r_y3": 448.718, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.387, "r_y0": 573.292, "r_x1": 173.016, "r_y1": 573.292, "r_x2": 173.016, "r_y2": 566.0989999999999, "r_x3": 167.387, "r_y3": 566.0989999999999, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.456, "r_y0": 629.067, "r_x1": 253.657, "r_y1": 629.067, "r_x2": 253.657, "r_y2": 621.874, "r_x3": 248.456, "r_y3": 621.874, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.901, "r_y0": 526.4870000000001, "r_x1": 401.531, "r_y1": 526.4870000000001, "r_x2": 401.531, "r_y2": 519.293, "r_x3": 395.901, "r_y3": 519.293, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.46, "r_y0": 597.268, "r_x1": 177.455, "r_y1": 580.287, "r_x2": 171.7, "r_y2": 580.289, "r_x3": 171.705, "r_y3": 597.269, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.891, "r_y0": 649.923, "r_x1": 256.886, "r_y1": 633.633, "r_x2": 251.131, "r_y2": 633.634, "r_x3": 251.136, "r_y3": 649.925, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 607.287, "r_x1": 427.038, "r_y1": 607.287, "r_x2": 427.038, "r_y2": 601.532, "r_x3": 372.146, "r_y3": 601.532, "coord_origin": "TOPLEFT"}, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 613.729, "r_x1": 430.068, "r_y1": 613.729, "r_x2": 430.068, "r_y2": 607.9739999999999, "r_x3": 372.146, "r_y3": 607.9739999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 648.702, "r_x1": 231.082, "r_y1": 648.702, "r_x2": 231.082, "r_y2": 642.947, "r_x3": 176.88, "r_y3": 642.947, "coord_origin": "TOPLEFT"}, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 655.144, "r_x1": 230.993, "r_y1": 655.144, "r_x2": 230.993, "r_y2": 649.389, "r_x3": 176.88, "r_y3": 649.389, "coord_origin": "TOPLEFT"}, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 661.586, "r_x1": 203.932, "r_y1": 661.586, "r_x2": 203.932, "r_y2": 655.831, "r_x3": 176.88, "r_y3": 655.831, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.932, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.563, "r_x3": 215.932, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.057, "r_y0": 569.16, "r_x1": 231.719, "r_y1": 569.16, "r_x2": 231.719, "r_y2": 557.563, "r_x3": 229.057, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.209, "r_y0": 451.197, "r_x1": 263.57, "r_y1": 451.197, "r_x2": 263.57, "r_y2": 448.461, "r_x3": 261.209, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.335, "r_y0": 451.197, "r_x1": 313.636, "r_y1": 451.197, "r_x2": 313.636, "r_y2": 448.461, "r_x3": 312.335, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.411, "r_y0": 451.197, "r_x1": 380.057, "r_y1": 451.197, "r_x2": 380.057, "r_y2": 448.461, "r_x3": 377.411, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 456.076, "r_x1": 205.818, "r_y1": 456.076, "r_x2": 205.818, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.208, "r_y0": 456.076, "r_x1": 229.761, "r_y1": 456.076, "r_x2": 229.761, "r_y2": 453.34, "r_x3": 222.208, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.267, "r_y0": 456.076, "r_x1": 250.82, "r_y1": 456.076, "r_x2": 250.82, "r_y2": 453.34, "r_x3": 243.267, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.297, "r_y0": 456.076, "r_x1": 271.842, "r_y1": 456.076, "r_x2": 271.842, "r_y2": 453.34, "r_x3": 264.297, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.319, "r_y0": 456.076, "r_x1": 292.872, "r_y1": 456.076, "r_x2": 292.872, "r_y2": 453.34, "r_x3": 285.319, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.378, "r_y0": 456.076, "r_x1": 311.766, "r_y1": 456.076, "r_x2": 311.766, "r_y2": 453.34, "r_x3": 306.378, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.417, "r_y0": 456.076, "r_x1": 325.575, "r_y1": 456.076, "r_x2": 325.575, "r_y2": 453.34, "r_x3": 323.417, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.458, "r_y0": 456.076, "r_x1": 336.616, "r_y1": 456.076, "r_x2": 336.616, "r_y2": 453.34, "r_x3": 334.458, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.528, "r_y0": 456.076, "r_x1": 347.685, "r_y1": 456.076, "r_x2": 347.685, "r_y2": 453.34, "r_x3": 345.528, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.569, "r_y0": 456.076, "r_x1": 358.726, "r_y1": 456.076, "r_x2": 358.726, "r_y2": 453.34, "r_x3": 356.569, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.638, "r_y0": 456.076, "r_x1": 371.964, "r_y1": 456.076, "r_x2": 371.964, "r_y2": 453.34, "r_x3": 367.638, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.673, "r_y0": 456.076, "r_x1": 386.999, "r_y1": 456.076, "r_x2": 386.999, "r_y2": 453.34, "r_x3": 382.673, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.737, "r_y0": 456.076, "r_x1": 402.063, "r_y1": 456.076, "r_x2": 402.063, "r_y2": 453.34, "r_x3": 397.737, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 457.8, "r_x1": 414.935, "r_y1": 457.8, "r_x2": 414.935, "r_y2": 447.993, "r_x3": 412.789, "r_y3": 447.993, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.07, "r_y0": 456.076, "r_x1": 422.535, "r_y1": 456.076, "r_x2": 422.535, "r_y2": 453.34, "r_x3": 416.07, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "128", "orig": "128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.563, "r_y1": 466.66, "r_x2": 204.563, "r_y2": 463.924, "r_x3": 200.64, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.924, "r_x3": 367.626, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 466.66, "r_x1": 384.616, "r_y1": 466.66, "r_x2": 384.616, "r_y2": 463.924, "r_x3": 382.661, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 466.66, "r_x1": 399.679, "r_y1": 466.66, "r_x2": 399.679, "r_y2": 463.924, "r_x3": 397.725, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 471.539, "r_x1": 206.503, "r_y1": 471.539, "r_x2": 206.503, "r_y2": 468.803, "r_x3": 200.64, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 471.539, "r_x1": 266.245, "r_y1": 471.539, "r_x2": 266.245, "r_y2": 468.803, "r_x3": 264.29, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.372, "r_y0": 471.539, "r_x1": 308.326, "r_y1": 471.539, "r_x2": 308.326, "r_y2": 468.803, "r_x3": 306.372, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.515, "r_y0": 471.539, "r_x1": 347.47, "r_y1": 471.539, "r_x2": 347.47, "r_y2": 468.803, "r_x3": 345.515, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.556, "r_y0": 471.539, "r_x1": 358.511, "r_y1": 471.539, "r_x2": 358.511, "r_y2": 468.803, "r_x3": 356.556, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 471.539, "r_x1": 369.58, "r_y1": 471.539, "r_x2": 369.58, "r_y2": 468.803, "r_x3": 367.626, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 471.539, "r_x1": 384.615, "r_y1": 471.539, "r_x2": 384.615, "r_y2": 468.803, "r_x3": 382.661, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 476.418, "r_x1": 206.503, "r_y1": 476.418, "r_x2": 206.503, "r_y2": 473.682, "r_x3": 200.64, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 476.418, "r_x1": 266.245, "r_y1": 476.418, "r_x2": 266.245, "r_y2": 473.682, "r_x3": 264.29, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 481.268, "r_x1": 206.503, "r_y1": 481.268, "r_x2": 206.503, "r_y2": 478.532, "r_x3": 200.64, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.264, "r_y0": 481.268, "r_x1": 245.218, "r_y1": 481.268, "r_x2": 245.218, "r_y2": 478.532, "r_x3": 243.264, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 481.268, "r_x1": 266.245, "r_y1": 481.268, "r_x2": 266.245, "r_y2": 478.532, "r_x3": 264.29, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.405, "r_y0": 481.268, "r_x1": 325.359, "r_y1": 481.268, "r_x2": 325.359, "r_y2": 478.532, "r_x3": 323.405, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 481.268, "r_x1": 399.679, "r_y1": 481.268, "r_x2": 399.679, "r_y2": 478.532, "r_x3": 397.725, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 486.147, "r_x1": 206.503, "r_y1": 486.147, "r_x2": 206.503, "r_y2": 483.411, "r_x3": 200.64, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 486.147, "r_x1": 384.616, "r_y1": 486.147, "r_x2": 384.616, "r_y2": 483.411, "r_x3": 382.661, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 486.147, "r_x1": 401.648, "r_y1": 486.147, "r_x2": 401.648, "r_y2": 483.411, "r_x3": 397.725, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 486.147, "r_x1": 414.744, "r_y1": 486.147, "r_x2": 414.744, "r_y2": 483.411, "r_x3": 412.789, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 491.026, "r_x1": 207.134, "r_y1": 491.026, "r_x2": 207.134, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 491.026, "r_x1": 369.784, "r_y1": 491.026, "r_x2": 369.784, "r_y2": 488.29, "r_x3": 367.626, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 491.026, "r_x1": 384.819, "r_y1": 491.026, "r_x2": 384.819, "r_y2": 488.29, "r_x3": 382.661, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 491.026, "r_x1": 402.051, "r_y1": 491.026, "r_x2": 402.051, "r_y2": 488.29, "r_x3": 397.725, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 495.904, "r_x1": 208.472, "r_y1": 495.904, "r_x2": 208.472, "r_y2": 493.168, "r_x3": 200.64, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 495.904, "r_x1": 266.245, "r_y1": 495.904, "r_x2": 266.245, "r_y2": 493.168, "r_x3": 264.29, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 58, "label": "text", "bbox": {"l": 180.125, "t": 516.296, "r": 190.62, "b": 518.934, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 518.934, "r_x1": 190.62, "r_y1": 518.934, "r_x2": 190.62, "r_y2": 516.296, "r_x3": 180.125, "r_y3": 516.296, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 183.244, "t": 520.194, "r": 304.548, "b": 522.8330000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 522.8330000000001, "r_x1": 304.548, "r_y1": 522.8330000000001, "r_x2": 304.548, "r_y2": 520.194, "r_x3": 183.244, "r_y3": 520.194, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "orig": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 183.244, "t": 524.0930000000001, "r": 388.423, "b": 526.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 526.731, "r_x1": 388.423, "r_y1": 526.731, "r_x2": 388.423, "r_y2": 524.0930000000001, "r_x3": 183.244, "r_y3": 524.0930000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 183.244, "t": 527.992, "r": 388.423, "b": 530.63, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 530.63, "r_x1": 388.423, "r_y1": 530.63, "r_x2": 388.423, "r_y2": 527.992, "r_x3": 183.244, "r_y3": 527.992, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 183.244, "t": 531.8910000000001, "r": 388.423, "b": 534.529, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 534.529, "r_x1": 388.423, "r_y1": 534.529, "r_x2": 388.423, "r_y2": 531.8910000000001, "r_x3": 183.244, "r_y3": 531.8910000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 183.244, "t": 535.79, "r": 388.423, "b": 538.428, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 538.428, "r_x1": 388.423, "r_y1": 538.428, "r_x2": 388.423, "r_y2": 535.79, "r_x3": 183.244, "r_y3": 535.79, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 183.244, "t": 539.689, "r": 388.423, "b": 542.327, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 542.327, "r_x1": 388.423, "r_y1": 542.327, "r_x2": 388.423, "r_y2": 539.689, "r_x3": 183.244, "r_y3": 539.689, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 183.244, "t": 543.588, "r": 388.423, "b": 546.226, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 546.226, "r_x1": 388.423, "r_y1": 546.226, "r_x2": 388.423, "r_y2": 543.588, "r_x3": 183.244, "r_y3": 543.588, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 183.244, "t": 547.486, "r": 388.423, "b": 550.124, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 550.124, "r_x1": 388.423, "r_y1": 550.124, "r_x2": 388.423, "r_y2": 547.486, "r_x3": 183.244, "r_y3": 547.486, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 183.244, "t": 551.385, "r": 388.423, "b": 554.023, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 554.023, "r_x1": 388.423, "r_y1": 554.023, "r_x2": 388.423, "r_y2": 551.385, "r_x3": 183.244, "r_y3": 551.385, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 180.125, "t": 555.284, "r": 191.868, "b": 557.922, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 557.922, "r_x1": 191.868, "r_y1": 557.922, "r_x2": 191.868, "r_y2": 555.284, "r_x3": 180.125, "r_y3": 555.284, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 407.383, "t": 518.363, "r": 450.486, "b": 521.001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 521.001, "r_x1": 450.486, "r_y1": 521.001, "r_x2": 450.486, "r_y2": 518.363, "r_x3": 407.383, "r_y3": 518.363, "coord_origin": "TOPLEFT"}, "text": "C C L L L C L L L L L C L L NL", "orig": "C C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 407.383, "t": 522.262, "r": 450.486, "b": 524.9, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 524.9, "r_x1": 450.486, "r_y1": 524.9, "r_x2": 450.486, "r_y2": 522.262, "r_x3": 407.383, "r_y3": 522.262, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 407.383, "t": 526.1600000000001, "r": 450.486, "b": 528.799, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 528.799, "r_x1": 450.486, "r_y1": 528.799, "r_x2": 450.486, "r_y2": 526.1600000000001, "r_x3": 407.383, "r_y3": 526.1600000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 407.383, "t": 530.059, "r": 450.486, "b": 532.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 532.697, "r_x1": 450.486, "r_y1": 532.697, "r_x2": 450.486, "r_y2": 530.059, "r_x3": 407.383, "r_y3": 530.059, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 407.383, "t": 533.9580000000001, "r": 450.486, "b": 536.596, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 536.596, "r_x1": 450.486, "r_y1": 536.596, "r_x2": 450.486, "r_y2": 533.9580000000001, "r_x3": 407.383, "r_y3": 533.9580000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 407.383, "t": 537.857, "r": 450.486, "b": 540.495, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 540.495, "r_x1": 450.486, "r_y1": 540.495, "r_x2": 450.486, "r_y2": 537.857, "r_x3": 407.383, "r_y3": 537.857, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 407.383, "t": 541.756, "r": 450.486, "b": 544.394, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 544.394, "r_x1": 450.486, "r_y1": 544.394, "r_x2": 450.486, "r_y2": 541.756, "r_x3": 407.383, "r_y3": 541.756, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 407.383, "t": 545.655, "r": 450.486, "b": 548.293, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 548.293, "r_x1": 450.486, "r_y1": 548.293, "r_x2": 450.486, "r_y2": 545.655, "r_x3": 407.383, "r_y3": 545.655, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 407.383, "t": 549.554, "r": 450.486, "b": 552.192, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 552.192, "r_x1": 450.486, "r_y1": 552.192, "r_x2": 450.486, "r_y2": 549.554, "r_x3": 407.383, "r_y3": 549.554, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 164.529, "t": 509.533, "r": 181.853, "b": 515.288, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.529, "r_y0": 515.288, "r_x1": 181.853, "r_y1": 515.288, "r_x2": 181.853, "r_y2": 509.533, "r_x3": 164.529, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 183.584, "t": 509.533, "r": 208.901, "b": 515.288, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.584, "r_y0": 515.288, "r_x1": 208.901, "r_y1": 515.288, "r_x2": 208.901, "r_y2": 509.533, "r_x3": 183.584, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 210.633, "t": 509.533, "r": 221.04, "b": 515.288, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 515.288, "r_x1": 221.04, "r_y1": 515.288, "r_x2": 221.04, "r_y2": 509.533, "r_x3": 210.633, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 390.202, "t": 509.678, "r": 406.836, "b": 515.433, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.202, "r_y0": 515.433, "r_x1": 406.836, "r_y1": 515.433, "r_x2": 406.836, "r_y2": 509.678, "r_x3": 390.202, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 408.569, "t": 509.678, "r": 433.886, "b": 515.433, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.569, "r_y0": 515.433, "r_x1": 433.886, "r_y1": 515.433, "r_x2": 433.886, "r_y2": 509.678, "r_x3": 408.569, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 435.617, "t": 509.678, "r": 446.025, "b": 515.433, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.617, "r_y0": 515.433, "r_x1": 446.025, "r_y1": 515.433, "r_x2": 446.025, "r_y2": 509.678, "r_x3": 435.617, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 167.193, "t": 519.1659999999999, "r": 172.823, "b": 526.36, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.193, "r_y0": 526.36, "r_x1": 172.823, "r_y1": 526.36, "r_x2": 172.823, "r_y2": 519.1659999999999, "r_x3": 167.193, "r_y3": 519.1659999999999, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 187.337, "t": 448.718, "r": 192.967, "b": 455.912, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.337, "r_y0": 455.912, "r_x1": 192.967, "r_y1": 455.912, "r_x2": 192.967, "r_y2": 448.718, "r_x3": 187.337, "r_y3": 448.718, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 167.387, "t": 566.0989999999999, "r": 173.016, "b": 573.292, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.387, "r_y0": 573.292, "r_x1": 173.016, "r_y1": 573.292, "r_x2": 173.016, "r_y2": 566.0989999999999, "r_x3": 167.387, "r_y3": 566.0989999999999, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 248.456, "t": 621.874, "r": 253.657, "b": 629.067, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.456, "r_y0": 629.067, "r_x1": 253.657, "r_y1": 629.067, "r_x2": 253.657, "r_y2": 621.874, "r_x3": 248.456, "r_y3": 621.874, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 395.901, "t": 519.293, "r": 401.531, "b": 526.4870000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.901, "r_y0": 526.4870000000001, "r_x1": 401.531, "r_y1": 526.4870000000001, "r_x2": 401.531, "r_y2": 519.293, "r_x3": 395.901, "r_y3": 519.293, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 171.7, "t": 580.287, "r": 177.46, "b": 597.269, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.46, "r_y0": 597.268, "r_x1": 177.455, "r_y1": 580.287, "r_x2": 171.7, "r_y2": 580.289, "r_x3": 171.705, "r_y3": 597.269, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 251.131, "t": 633.633, "r": 256.891, "b": 649.925, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.891, "r_y0": 649.923, "r_x1": 256.886, "r_y1": 633.633, "r_x2": 251.131, "r_y2": 633.634, "r_x3": 251.136, "r_y3": 649.925, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 372.146, "t": 601.532, "r": 427.038, "b": 607.287, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 607.287, "r_x1": 427.038, "r_y1": 607.287, "r_x2": 427.038, "r_y2": 601.532, "r_x3": 372.146, "r_y3": 601.532, "coord_origin": "TOPLEFT"}, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 372.146, "t": 607.9739999999999, "r": 430.068, "b": 613.729, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 613.729, "r_x1": 430.068, "r_y1": 613.729, "r_x2": 430.068, "r_y2": 607.9739999999999, "r_x3": 372.146, "r_y3": 607.9739999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 176.88, "t": 642.947, "r": 231.082, "b": 648.702, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 648.702, "r_x1": 231.082, "r_y1": 648.702, "r_x2": 231.082, "r_y2": 642.947, "r_x3": 176.88, "r_y3": 642.947, "coord_origin": "TOPLEFT"}, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 176.88, "t": 649.389, "r": 230.993, "b": 655.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 655.144, "r_x1": 230.993, "r_y1": 655.144, "r_x2": 230.993, "r_y2": 649.389, "r_x3": 176.88, "r_y3": 649.389, "coord_origin": "TOPLEFT"}, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 176.88, "t": 655.831, "r": 203.932, "b": 661.586, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 661.586, "r_x1": 203.932, "r_y1": 661.586, "r_x2": 203.932, "r_y2": 655.831, "r_x3": 176.88, "r_y3": 655.831, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 215.932, "t": 557.563, "r": 218.47, "b": 569.16, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.932, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.563, "r_x3": 215.932, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 229.057, "t": 557.563, "r": 231.719, "b": 569.16, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.057, "r_y0": 569.16, "r_x1": 231.719, "r_y1": 569.16, "r_x2": 231.719, "r_y2": 557.563, "r_x3": 229.057, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 261.209, "t": 448.461, "r": 263.57, "b": 451.197, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.209, "r_y0": 451.197, "r_x1": 263.57, "r_y1": 451.197, "r_x2": 263.57, "r_y2": 448.461, "r_x3": 261.209, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 312.335, "t": 448.461, "r": 313.636, "b": 451.197, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.335, "r_y0": 451.197, "r_x1": 313.636, "r_y1": 451.197, "r_x2": 313.636, "r_y2": 448.461, "r_x3": 312.335, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 377.411, "t": 448.461, "r": 380.057, "b": 451.197, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.411, "r_y0": 451.197, "r_x1": 380.057, "r_y1": 451.197, "r_x2": 380.057, "r_y2": 448.461, "r_x3": 377.411, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 200.64, "t": 453.34, "r": 205.818, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 456.076, "r_x1": 205.818, "r_y1": 456.076, "r_x2": 205.818, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 222.208, "t": 453.34, "r": 229.761, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.208, "r_y0": 456.076, "r_x1": 229.761, "r_y1": 456.076, "r_x2": 229.761, "r_y2": 453.34, "r_x3": 222.208, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 243.267, "t": 453.34, "r": 250.82, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.267, "r_y0": 456.076, "r_x1": 250.82, "r_y1": 456.076, "r_x2": 250.82, "r_y2": 453.34, "r_x3": 243.267, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 264.297, "t": 453.34, "r": 271.842, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.297, "r_y0": 456.076, "r_x1": 271.842, "r_y1": 456.076, "r_x2": 271.842, "r_y2": 453.34, "r_x3": 264.297, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 285.319, "t": 453.34, "r": 292.872, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.319, "r_y0": 456.076, "r_x1": 292.872, "r_y1": 456.076, "r_x2": 292.872, "r_y2": 453.34, "r_x3": 285.319, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 306.378, "t": 453.34, "r": 311.766, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.378, "r_y0": 456.076, "r_x1": 311.766, "r_y1": 456.076, "r_x2": 311.766, "r_y2": 453.34, "r_x3": 306.378, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 323.417, "t": 453.34, "r": 325.575, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.417, "r_y0": 456.076, "r_x1": 325.575, "r_y1": 456.076, "r_x2": 325.575, "r_y2": 453.34, "r_x3": 323.417, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 334.458, "t": 453.34, "r": 336.616, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.458, "r_y0": 456.076, "r_x1": 336.616, "r_y1": 456.076, "r_x2": 336.616, "r_y2": 453.34, "r_x3": 334.458, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 345.528, "t": 453.34, "r": 347.685, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.528, "r_y0": 456.076, "r_x1": 347.685, "r_y1": 456.076, "r_x2": 347.685, "r_y2": 453.34, "r_x3": 345.528, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 356.569, "t": 453.34, "r": 358.726, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.569, "r_y0": 456.076, "r_x1": 358.726, "r_y1": 456.076, "r_x2": 358.726, "r_y2": 453.34, "r_x3": 356.569, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 367.638, "t": 453.34, "r": 371.964, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.638, "r_y0": 456.076, "r_x1": 371.964, "r_y1": 456.076, "r_x2": 371.964, "r_y2": 453.34, "r_x3": 367.638, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 382.673, "t": 453.34, "r": 386.999, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.673, "r_y0": 456.076, "r_x1": 386.999, "r_y1": 456.076, "r_x2": 386.999, "r_y2": 453.34, "r_x3": 382.673, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 397.737, "t": 453.34, "r": 402.063, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.737, "r_y0": 456.076, "r_x1": 402.063, "r_y1": 456.076, "r_x2": 402.063, "r_y2": 453.34, "r_x3": 397.737, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 412.789, "t": 447.993, "r": 414.935, "b": 457.8, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 457.8, "r_x1": 414.935, "r_y1": 457.8, "r_x2": 414.935, "r_y2": 447.993, "r_x3": 412.789, "r_y3": 447.993, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 416.07, "t": 453.34, "r": 422.535, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.07, "r_y0": 456.076, "r_x1": 422.535, "r_y1": 456.076, "r_x2": 422.535, "r_y2": 453.34, "r_x3": 416.07, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "128", "orig": "128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 200.64, "t": 463.924, "r": 204.563, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.563, "r_y1": 466.66, "r_x2": 204.563, "r_y2": 463.924, "r_x3": 200.64, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 367.626, "t": 463.924, "r": 369.58, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.924, "r_x3": 367.626, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 382.661, "t": 463.924, "r": 384.616, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 466.66, "r_x1": 384.616, "r_y1": 466.66, "r_x2": 384.616, "r_y2": 463.924, "r_x3": 382.661, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 397.725, "t": 463.924, "r": 399.679, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 466.66, "r_x1": 399.679, "r_y1": 466.66, "r_x2": 399.679, "r_y2": 463.924, "r_x3": 397.725, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 200.64, "t": 468.803, "r": 206.503, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 471.539, "r_x1": 206.503, "r_y1": 471.539, "r_x2": 206.503, "r_y2": 468.803, "r_x3": 200.64, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 264.29, "t": 468.803, "r": 266.245, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 471.539, "r_x1": 266.245, "r_y1": 471.539, "r_x2": 266.245, "r_y2": 468.803, "r_x3": 264.29, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 306.372, "t": 468.803, "r": 308.326, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.372, "r_y0": 471.539, "r_x1": 308.326, "r_y1": 471.539, "r_x2": 308.326, "r_y2": 468.803, "r_x3": 306.372, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 345.515, "t": 468.803, "r": 347.47, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.515, "r_y0": 471.539, "r_x1": 347.47, "r_y1": 471.539, "r_x2": 347.47, "r_y2": 468.803, "r_x3": 345.515, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 124, "label": "text", "bbox": {"l": 356.556, "t": 468.803, "r": 358.511, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.556, "r_y0": 471.539, "r_x1": 358.511, "r_y1": 471.539, "r_x2": 358.511, "r_y2": 468.803, "r_x3": 356.556, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 367.626, "t": 468.803, "r": 369.58, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 471.539, "r_x1": 369.58, "r_y1": 471.539, "r_x2": 369.58, "r_y2": 468.803, "r_x3": 367.626, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 382.661, "t": 468.803, "r": 384.615, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 471.539, "r_x1": 384.615, "r_y1": 471.539, "r_x2": 384.615, "r_y2": 468.803, "r_x3": 382.661, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 200.64, "t": 473.682, "r": 206.503, "b": 476.418, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 476.418, "r_x1": 206.503, "r_y1": 476.418, "r_x2": 206.503, "r_y2": 473.682, "r_x3": 200.64, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 128, "label": "text", "bbox": {"l": 264.29, "t": 473.682, "r": 266.245, "b": 476.418, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 476.418, "r_x1": 266.245, "r_y1": 476.418, "r_x2": 266.245, "r_y2": 473.682, "r_x3": 264.29, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 129, "label": "text", "bbox": {"l": 200.64, "t": 478.532, "r": 206.503, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 481.268, "r_x1": 206.503, "r_y1": 481.268, "r_x2": 206.503, "r_y2": 478.532, "r_x3": 200.64, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 130, "label": "text", "bbox": {"l": 243.264, "t": 478.532, "r": 245.218, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.264, "r_y0": 481.268, "r_x1": 245.218, "r_y1": 481.268, "r_x2": 245.218, "r_y2": 478.532, "r_x3": 243.264, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 131, "label": "text", "bbox": {"l": 264.29, "t": 478.532, "r": 266.245, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 481.268, "r_x1": 266.245, "r_y1": 481.268, "r_x2": 266.245, "r_y2": 478.532, "r_x3": 264.29, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 132, "label": "text", "bbox": {"l": 323.405, "t": 478.532, "r": 325.359, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.405, "r_y0": 481.268, "r_x1": 325.359, "r_y1": 481.268, "r_x2": 325.359, "r_y2": 478.532, "r_x3": 323.405, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 133, "label": "text", "bbox": {"l": 397.725, "t": 478.532, "r": 399.679, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 481.268, "r_x1": 399.679, "r_y1": 481.268, "r_x2": 399.679, "r_y2": 478.532, "r_x3": 397.725, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 134, "label": "text", "bbox": {"l": 200.64, "t": 483.411, "r": 206.503, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 486.147, "r_x1": 206.503, "r_y1": 486.147, "r_x2": 206.503, "r_y2": 483.411, "r_x3": 200.64, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 135, "label": "text", "bbox": {"l": 382.661, "t": 483.411, "r": 384.616, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 486.147, "r_x1": 384.616, "r_y1": 486.147, "r_x2": 384.616, "r_y2": 483.411, "r_x3": 382.661, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 136, "label": "text", "bbox": {"l": 397.725, "t": 483.411, "r": 401.648, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 486.147, "r_x1": 401.648, "r_y1": 486.147, "r_x2": 401.648, "r_y2": 483.411, "r_x3": 397.725, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 137, "label": "text", "bbox": {"l": 412.789, "t": 483.411, "r": 414.744, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 486.147, "r_x1": 414.744, "r_y1": 486.147, "r_x2": 414.744, "r_y2": 483.411, "r_x3": 412.789, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 138, "label": "text", "bbox": {"l": 200.64, "t": 488.29, "r": 207.134, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 491.026, "r_x1": 207.134, "r_y1": 491.026, "r_x2": 207.134, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 139, "label": "text", "bbox": {"l": 367.626, "t": 488.29, "r": 369.784, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 491.026, "r_x1": 369.784, "r_y1": 491.026, "r_x2": 369.784, "r_y2": 488.29, "r_x3": 367.626, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 140, "label": "text", "bbox": {"l": 382.661, "t": 488.29, "r": 384.819, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 491.026, "r_x1": 384.819, "r_y1": 491.026, "r_x2": 384.819, "r_y2": 488.29, "r_x3": 382.661, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 141, "label": "text", "bbox": {"l": 397.725, "t": 488.29, "r": 402.051, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 491.026, "r_x1": 402.051, "r_y1": 491.026, "r_x2": 402.051, "r_y2": 488.29, "r_x3": 397.725, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 142, "label": "text", "bbox": {"l": 200.64, "t": 493.168, "r": 208.472, "b": 495.904, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 495.904, "r_x1": 208.472, "r_y1": 495.904, "r_x2": 208.472, "r_y2": 493.168, "r_x3": 200.64, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 143, "label": "text", "bbox": {"l": 264.29, "t": 493.168, "r": 266.245, "b": 495.904, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 495.904, "r_x1": 266.245, "r_y1": 495.904, "r_x2": 266.245, "r_y2": 493.168, "r_x3": 264.29, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 144, "label": "text", "bbox": {"l": 227.915, "t": 665.826, "r": 230.1, "b": 675.346, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.915, "r_y0": 675.346, "r_x1": 230.1, "r_y1": 675.346, "r_x2": 230.1, "r_y2": 665.826, "r_x3": 227.915, "r_y3": 665.826, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 145, "label": "text", "bbox": {"l": 300.581, "t": 683.622, "r": 302.726, "b": 693.429, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.581, "r_y0": 693.429, "r_x1": 302.726, "r_y1": 693.429, "r_x2": 302.726, "r_y2": 683.622, "r_x3": 300.581, "r_y3": 683.622, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {"0": {"label": "table", "id": 0, "page_no": 9, "cluster": {"id": 0, "label": "table", "bbox": {"l": 143.6376495361328, "t": 156.3477020263672, "r": 470.8485412597656, "b": 263.2624816894531, "coord_origin": "TOPLEFT"}, "confidence": 0.9884640574455261, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.782, "r_y0": 175.57000000000005, "r_x1": 194.998, "r_y1": 175.57000000000005, "r_x2": 194.998, "r_y2": 164.28099999999995, "r_x3": 160.782, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.525, "r_y0": 175.54499999999996, "r_x1": 254.045, "r_y1": 175.54499999999996, "r_x2": 254.045, "r_y2": 164.25599999999997, "r_x3": 215.525, "r_y3": 164.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.397, "r_y0": 170.09000000000003, "r_x1": 323.991, "r_y1": 170.09000000000003, "r_x2": 323.991, "r_y2": 158.80100000000004, "r_x3": 300.397, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.345, "r_y0": 175.57000000000005, "r_x1": 414.747, "r_y1": 175.57000000000005, "r_x2": 414.747, "r_y2": 164.28099999999995, "r_x3": 370.345, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.737, "r_y0": 170.09000000000003, "r_x1": 463.108, "r_y1": 170.09000000000003, "r_x2": 463.108, "r_y2": 158.80100000000004, "r_x3": 426.737, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.114, "r_y0": 181.04899999999998, "r_x1": 466.727, "r_y1": 181.04899999999998, "r_x2": 466.727, "r_y2": 169.76, "r_x3": 423.114, "r_y3": 169.76, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.413, "r_y0": 183.04200000000003, "r_x1": 288.06, "r_y1": 183.04200000000003, "r_x2": 288.06, "r_y2": 171.75300000000004, "r_x3": 262.413, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.429, "r_y0": 183.04200000000003, "r_x1": 329.447, "r_y1": 183.04200000000003, "r_x2": 329.447, "r_y2": 171.75300000000004, "r_x3": 296.429, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.033, "r_y0": 183.04200000000003, "r_x1": 354.758, "r_y1": 183.04200000000003, "r_x2": 354.758, "r_y2": 171.75300000000004, "r_x3": 345.033, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.538, "r_y0": 201.87099999999998, "r_x1": 201.241, "r_y1": 201.87099999999998, "r_x2": 201.241, "r_y2": 190.582, "r_x3": 154.538, "r_y3": 190.582, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 196.39200000000005, "r_x1": 247.132, "r_y1": 196.39200000000005, "r_x2": 247.132, "r_y2": 185.10299999999995, "r_x3": 222.437, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 196.39200000000005, "r_x1": 285.731, "r_y1": 196.39200000000005, "r_x2": 285.731, "r_y2": 185.10299999999995, "r_x3": 264.744, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 196.39200000000005, "r_x1": 323.431, "r_y1": 196.39200000000005, "r_x2": 323.431, "r_y2": 185.10299999999995, "r_x3": 302.444, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 196.39200000000005, "r_x1": 360.39, "r_y1": 196.39200000000005, "r_x2": 360.39, "r_y2": 185.10299999999995, "r_x3": 339.403, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.116, "r_y0": 195.24400000000003, "r_x1": 401.973, "r_y1": 195.24400000000003, "r_x2": 401.973, "r_y2": 187.31799999999998, "r_x3": 383.116, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 195.24400000000003, "r_x1": 454.35, "r_y1": 195.24400000000003, "r_x2": 454.35, "r_y2": 187.31799999999998, "r_x3": 435.493, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 209.34299999999996, "r_x1": 248.667, "r_y1": 209.34299999999996, "r_x2": 248.667, "r_y2": 198.05399999999997, "r_x3": 220.903, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 209.34299999999996, "r_x1": 285.731, "r_y1": 209.34299999999996, "r_x2": 285.731, "r_y2": 198.05399999999997, "r_x3": 264.744, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 209.34299999999996, "r_x1": 323.431, "r_y1": 209.34299999999996, "r_x2": 323.431, "r_y2": 198.05399999999997, "r_x3": 302.444, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 209.34299999999996, "r_x1": 360.39, "r_y1": 209.34299999999996, "r_x2": 360.39, "r_y2": 198.05399999999997, "r_x3": 339.403, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 209.34299999999996, "r_x1": 403.039, "r_y1": 209.34299999999996, "r_x2": 403.039, "r_y2": 198.05399999999997, "r_x3": 382.052, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 209.34299999999996, "r_x1": 453.112, "r_y1": 209.34299999999996, "r_x2": 453.112, "r_y2": 198.05399999999997, "r_x3": 436.732, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.945, "r_y0": 228.173, "r_x1": 199.834, "r_y1": 228.173, "r_x2": 199.834, "r_y2": 216.88400000000001, "r_x3": 155.945, "r_y3": 216.88400000000001, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 222.69299999999998, "r_x1": 247.132, "r_y1": 222.69299999999998, "r_x2": 247.132, "r_y2": 211.404, "r_x3": 222.437, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 222.69299999999998, "r_x1": 285.731, "r_y1": 222.69299999999998, "r_x2": 285.731, "r_y2": 211.404, "r_x3": 264.744, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 222.69299999999998, "r_x1": 323.431, "r_y1": 222.69299999999998, "r_x2": 323.431, "r_y2": 211.404, "r_x3": 302.444, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 221.54499999999996, "r_x1": 361.976, "r_y1": 221.54499999999996, "r_x2": 361.976, "r_y2": 213.61900000000003, "r_x3": 337.815, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 221.54499999999996, "r_x1": 404.625, "r_y1": 221.54499999999996, "r_x2": 404.625, "r_y2": 213.61900000000003, "r_x3": 380.464, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 221.54499999999996, "r_x1": 454.35, "r_y1": 221.54499999999996, "r_x2": 454.35, "r_y2": 213.61900000000003, "r_x3": 435.493, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 235.64499999999998, "r_x1": 248.667, "r_y1": 235.64499999999998, "r_x2": 248.667, "r_y2": 224.356, "r_x3": 220.903, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 235.64499999999998, "r_x1": 285.731, "r_y1": 235.64499999999998, "r_x2": 285.731, "r_y2": 224.356, "r_x3": 264.744, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 235.64499999999998, "r_x1": 323.431, "r_y1": 235.64499999999998, "r_x2": 323.431, "r_y2": 224.356, "r_x3": 302.444, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.706, "r_y0": 235.64499999999998, "r_x1": 358.086, "r_y1": 235.64499999999998, "r_x2": 358.086, "r_y2": 224.356, "r_x3": 341.706, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 235.64499999999998, "r_x1": 403.039, "r_y1": 235.64499999999998, "r_x2": 403.039, "r_y2": 224.356, "r_x3": 382.052, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 235.64499999999998, "r_x1": 453.112, "r_y1": 235.64499999999998, "r_x2": 453.112, "r_y2": 224.356, "r_x3": 436.732, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.626, "r_y0": 254.47400000000005, "r_x1": 207.152, "r_y1": 254.47400000000005, "r_x2": 207.152, "r_y2": 243.18499999999995, "r_x3": 148.626, "r_y3": 243.18499999999995, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 248.99400000000003, "r_x1": 247.132, "r_y1": 248.99400000000003, "r_x2": 247.132, "r_y2": 237.70500000000004, "r_x3": 222.437, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 248.99400000000003, "r_x1": 285.731, "r_y1": 248.99400000000003, "r_x2": 285.731, "r_y2": 237.70500000000004, "r_x3": 264.744, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 248.99400000000003, "r_x1": 323.431, "r_y1": 248.99400000000003, "r_x2": 323.431, "r_y2": 237.70500000000004, "r_x3": 302.444, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 247.846, "r_x1": 361.976, "r_y1": 247.846, "r_x2": 361.976, "r_y2": 239.91999999999996, "r_x3": 337.815, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 247.846, "r_x1": 404.625, "r_y1": 247.846, "r_x2": 404.625, "r_y2": 239.91999999999996, "r_x3": 380.464, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 247.846, "r_x1": 454.35, "r_y1": 247.846, "r_x2": 454.35, "r_y2": 239.91999999999996, "r_x3": 435.493, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 261.946, "r_x1": 248.667, "r_y1": 261.946, "r_x2": 248.667, "r_y2": 250.65700000000004, "r_x3": 220.903, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 261.946, "r_x1": 285.731, "r_y1": 261.946, "r_x2": 285.731, "r_y2": 250.65700000000004, "r_x3": 264.744, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 261.946, "r_x1": 323.431, "r_y1": 261.946, "r_x2": 323.431, "r_y2": 250.65700000000004, "r_x3": 302.444, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 261.946, "r_x1": 360.39, "r_y1": 261.946, "r_x2": 360.39, "r_y2": 250.65700000000004, "r_x3": 339.403, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 261.946, "r_x1": 403.039, "r_y1": 261.946, "r_x2": 403.039, "r_y2": 250.65700000000004, "r_x3": 382.052, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 261.946, "r_x1": 453.112, "r_y1": 261.946, "r_x2": 453.112, "r_y2": 250.65700000000004, "r_x3": 436.732, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 10, "label": "text", "bbox": {"l": 160.782, "t": 164.28099999999995, "r": 194.998, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.782, "r_y0": 175.57000000000005, "r_x1": 194.998, "r_y1": 175.57000000000005, "r_x2": 194.998, "r_y2": 164.28099999999995, "r_x3": 160.782, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 215.525, "t": 164.25599999999997, "r": 254.045, "b": 175.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.525, "r_y0": 175.54499999999996, "r_x1": 254.045, "r_y1": 175.54499999999996, "r_x2": 254.045, "r_y2": 164.25599999999997, "r_x3": 215.525, "r_y3": 164.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 300.397, "t": 158.80100000000004, "r": 323.991, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.397, "r_y0": 170.09000000000003, "r_x1": 323.991, "r_y1": 170.09000000000003, "r_x2": 323.991, "r_y2": 158.80100000000004, "r_x3": 300.397, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 370.345, "t": 164.28099999999995, "r": 414.747, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.345, "r_y0": 175.57000000000005, "r_x1": 414.747, "r_y1": 175.57000000000005, "r_x2": 414.747, "r_y2": 164.28099999999995, "r_x3": 370.345, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 426.737, "t": 158.80100000000004, "r": 463.108, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.737, "r_y0": 170.09000000000003, "r_x1": 463.108, "r_y1": 170.09000000000003, "r_x2": 463.108, "r_y2": 158.80100000000004, "r_x3": 426.737, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 423.114, "t": 169.76, "r": 466.727, "b": 181.04899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.114, "r_y0": 181.04899999999998, "r_x1": 466.727, "r_y1": 181.04899999999998, "r_x2": 466.727, "r_y2": 169.76, "r_x3": 423.114, "r_y3": 169.76, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 262.413, "t": 171.75300000000004, "r": 288.06, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.413, "r_y0": 183.04200000000003, "r_x1": 288.06, "r_y1": 183.04200000000003, "r_x2": 288.06, "r_y2": 171.75300000000004, "r_x3": 262.413, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 296.429, "t": 171.75300000000004, "r": 329.447, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.429, "r_y0": 183.04200000000003, "r_x1": 329.447, "r_y1": 183.04200000000003, "r_x2": 329.447, "r_y2": 171.75300000000004, "r_x3": 296.429, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 345.033, "t": 171.75300000000004, "r": 354.758, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.033, "r_y0": 183.04200000000003, "r_x1": 354.758, "r_y1": 183.04200000000003, "r_x2": 354.758, "r_y2": 171.75300000000004, "r_x3": 345.033, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 154.538, "t": 190.582, "r": 201.241, "b": 201.87099999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.538, "r_y0": 201.87099999999998, "r_x1": 201.241, "r_y1": 201.87099999999998, "r_x2": 201.241, "r_y2": 190.582, "r_x3": 154.538, "r_y3": 190.582, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 222.437, "t": 185.10299999999995, "r": 247.132, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 196.39200000000005, "r_x1": 247.132, "r_y1": 196.39200000000005, "r_x2": 247.132, "r_y2": 185.10299999999995, "r_x3": 222.437, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 264.744, "t": 185.10299999999995, "r": 285.731, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 196.39200000000005, "r_x1": 285.731, "r_y1": 196.39200000000005, "r_x2": 285.731, "r_y2": 185.10299999999995, "r_x3": 264.744, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 302.444, "t": 185.10299999999995, "r": 323.431, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 196.39200000000005, "r_x1": 323.431, "r_y1": 196.39200000000005, "r_x2": 323.431, "r_y2": 185.10299999999995, "r_x3": 302.444, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 339.403, "t": 185.10299999999995, "r": 360.39, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 196.39200000000005, "r_x1": 360.39, "r_y1": 196.39200000000005, "r_x2": 360.39, "r_y2": 185.10299999999995, "r_x3": 339.403, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 383.116, "t": 187.31799999999998, "r": 401.973, "b": 195.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.116, "r_y0": 195.24400000000003, "r_x1": 401.973, "r_y1": 195.24400000000003, "r_x2": 401.973, "r_y2": 187.31799999999998, "r_x3": 383.116, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 435.493, "t": 187.31799999999998, "r": 454.35, "b": 195.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 195.24400000000003, "r_x1": 454.35, "r_y1": 195.24400000000003, "r_x2": 454.35, "r_y2": 187.31799999999998, "r_x3": 435.493, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 220.903, "t": 198.05399999999997, "r": 248.667, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 209.34299999999996, "r_x1": 248.667, "r_y1": 209.34299999999996, "r_x2": 248.667, "r_y2": 198.05399999999997, "r_x3": 220.903, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 264.744, "t": 198.05399999999997, "r": 285.731, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 209.34299999999996, "r_x1": 285.731, "r_y1": 209.34299999999996, "r_x2": 285.731, "r_y2": 198.05399999999997, "r_x3": 264.744, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 302.444, "t": 198.05399999999997, "r": 323.431, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 209.34299999999996, "r_x1": 323.431, "r_y1": 209.34299999999996, "r_x2": 323.431, "r_y2": 198.05399999999997, "r_x3": 302.444, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 339.403, "t": 198.05399999999997, "r": 360.39, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 209.34299999999996, "r_x1": 360.39, "r_y1": 209.34299999999996, "r_x2": 360.39, "r_y2": 198.05399999999997, "r_x3": 339.403, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 382.052, "t": 198.05399999999997, "r": 403.039, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 209.34299999999996, "r_x1": 403.039, "r_y1": 209.34299999999996, "r_x2": 403.039, "r_y2": 198.05399999999997, "r_x3": 382.052, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 436.732, "t": 198.05399999999997, "r": 453.112, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 209.34299999999996, "r_x1": 453.112, "r_y1": 209.34299999999996, "r_x2": 453.112, "r_y2": 198.05399999999997, "r_x3": 436.732, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 155.945, "t": 216.88400000000001, "r": 199.834, "b": 228.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.945, "r_y0": 228.173, "r_x1": 199.834, "r_y1": 228.173, "r_x2": 199.834, "r_y2": 216.88400000000001, "r_x3": 155.945, "r_y3": 216.88400000000001, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 222.437, "t": 211.404, "r": 247.132, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 222.69299999999998, "r_x1": 247.132, "r_y1": 222.69299999999998, "r_x2": 247.132, "r_y2": 211.404, "r_x3": 222.437, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 264.744, "t": 211.404, "r": 285.731, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 222.69299999999998, "r_x1": 285.731, "r_y1": 222.69299999999998, "r_x2": 285.731, "r_y2": 211.404, "r_x3": 264.744, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 302.444, "t": 211.404, "r": 323.431, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 222.69299999999998, "r_x1": 323.431, "r_y1": 222.69299999999998, "r_x2": 323.431, "r_y2": 211.404, "r_x3": 302.444, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 337.815, "t": 213.61900000000003, "r": 361.976, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 221.54499999999996, "r_x1": 361.976, "r_y1": 221.54499999999996, "r_x2": 361.976, "r_y2": 213.61900000000003, "r_x3": 337.815, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 380.464, "t": 213.61900000000003, "r": 404.625, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 221.54499999999996, "r_x1": 404.625, "r_y1": 221.54499999999996, "r_x2": 404.625, "r_y2": 213.61900000000003, "r_x3": 380.464, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 435.493, "t": 213.61900000000003, "r": 454.35, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 221.54499999999996, "r_x1": 454.35, "r_y1": 221.54499999999996, "r_x2": 454.35, "r_y2": 213.61900000000003, "r_x3": 435.493, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 220.903, "t": 224.356, "r": 248.667, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 235.64499999999998, "r_x1": 248.667, "r_y1": 235.64499999999998, "r_x2": 248.667, "r_y2": 224.356, "r_x3": 220.903, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 264.744, "t": 224.356, "r": 285.731, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 235.64499999999998, "r_x1": 285.731, "r_y1": 235.64499999999998, "r_x2": 285.731, "r_y2": 224.356, "r_x3": 264.744, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 302.444, "t": 224.356, "r": 323.431, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 235.64499999999998, "r_x1": 323.431, "r_y1": 235.64499999999998, "r_x2": 323.431, "r_y2": 224.356, "r_x3": 302.444, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 341.706, "t": 224.356, "r": 358.086, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.706, "r_y0": 235.64499999999998, "r_x1": 358.086, "r_y1": 235.64499999999998, "r_x2": 358.086, "r_y2": 224.356, "r_x3": 341.706, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 382.052, "t": 224.356, "r": 403.039, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 235.64499999999998, "r_x1": 403.039, "r_y1": 235.64499999999998, "r_x2": 403.039, "r_y2": 224.356, "r_x3": 382.052, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 436.732, "t": 224.356, "r": 453.112, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 235.64499999999998, "r_x1": 453.112, "r_y1": 235.64499999999998, "r_x2": 453.112, "r_y2": 224.356, "r_x3": 436.732, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 148.626, "t": 243.18499999999995, "r": 207.152, "b": 254.47400000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.626, "r_y0": 254.47400000000005, "r_x1": 207.152, "r_y1": 254.47400000000005, "r_x2": 207.152, "r_y2": 243.18499999999995, "r_x3": 148.626, "r_y3": 243.18499999999995, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 222.437, "t": 237.70500000000004, "r": 247.132, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 248.99400000000003, "r_x1": 247.132, "r_y1": 248.99400000000003, "r_x2": 247.132, "r_y2": 237.70500000000004, "r_x3": 222.437, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 264.744, "t": 237.70500000000004, "r": 285.731, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 248.99400000000003, "r_x1": 285.731, "r_y1": 248.99400000000003, "r_x2": 285.731, "r_y2": 237.70500000000004, "r_x3": 264.744, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 302.444, "t": 237.70500000000004, "r": 323.431, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 248.99400000000003, "r_x1": 323.431, "r_y1": 248.99400000000003, "r_x2": 323.431, "r_y2": 237.70500000000004, "r_x3": 302.444, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 337.815, "t": 239.91999999999996, "r": 361.976, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 247.846, "r_x1": 361.976, "r_y1": 247.846, "r_x2": 361.976, "r_y2": 239.91999999999996, "r_x3": 337.815, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 380.464, "t": 239.91999999999996, "r": 404.625, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 247.846, "r_x1": 404.625, "r_y1": 247.846, "r_x2": 404.625, "r_y2": 239.91999999999996, "r_x3": 380.464, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 435.493, "t": 239.91999999999996, "r": 454.35, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 247.846, "r_x1": 454.35, "r_y1": 247.846, "r_x2": 454.35, "r_y2": 239.91999999999996, "r_x3": 435.493, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 220.903, "t": 250.65700000000004, "r": 248.667, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 261.946, "r_x1": 248.667, "r_y1": 261.946, "r_x2": 248.667, "r_y2": 250.65700000000004, "r_x3": 220.903, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 264.744, "t": 250.65700000000004, "r": 285.731, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 261.946, "r_x1": 285.731, "r_y1": 261.946, "r_x2": 285.731, "r_y2": 250.65700000000004, "r_x3": 264.744, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 302.444, "t": 250.65700000000004, "r": 323.431, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 261.946, "r_x1": 323.431, "r_y1": 261.946, "r_x2": 323.431, "r_y2": 250.65700000000004, "r_x3": 302.444, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 339.403, "t": 250.65700000000004, "r": 360.39, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 261.946, "r_x1": 360.39, "r_y1": 261.946, "r_x2": 360.39, "r_y2": 250.65700000000004, "r_x3": 339.403, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 382.052, "t": 250.65700000000004, "r": 403.039, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 261.946, "r_x1": 403.039, "r_y1": 261.946, "r_x2": 403.039, "r_y2": 250.65700000000004, "r_x3": 382.052, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 436.732, "t": 250.65700000000004, "r": 453.112, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 261.946, "r_x1": 453.112, "r_y1": 261.946, "r_x2": 453.112, "r_y2": 250.65700000000004, "r_x3": 436.732, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 5, "num_cols": 7, "table_cells": [{"bbox": {"l": 160.782, "t": 164.28099999999995, "r": 194.998, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 215.525, "t": 164.25599999999997, "r": 254.045, "b": 175.54499999999996, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 300.397, "t": 158.80100000000004, "r": 323.991, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 370.345, "t": 164.28099999999995, "r": 414.747, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 423.114, "t": 158.80100000000004, "r": 466.727, "b": 181.04899999999998, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 262.413, "t": 171.75300000000004, "r": 288.06, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 296.429, "t": 171.75300000000004, "r": 329.447, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 345.033, "t": 171.75300000000004, "r": 354.758, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 154.538, "t": 190.582, "r": 201.241, "b": 201.87099999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.903, "t": 185.10299999999995, "r": 248.667, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 264.744, "t": 185.10299999999995, "r": 285.731, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 302.444, "t": 185.10299999999995, "r": 323.431, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 339.403, "t": 185.10299999999995, "r": 360.39, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 382.052, "t": 187.31799999999998, "r": 403.039, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 435.493, "t": 187.31799999999998, "r": 454.35, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 155.945, "t": 216.88400000000001, "r": 199.834, "b": 228.173, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.903, "t": 211.404, "r": 248.667, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 264.744, "t": 211.404, "r": 285.731, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 302.444, "t": 211.404, "r": 323.431, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 337.815, "t": 213.61900000000003, "r": 361.976, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 380.464, "t": 213.61900000000003, "r": 404.625, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 435.493, "t": 213.61900000000003, "r": 454.35, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 148.626, "t": 243.18499999999995, "r": 207.152, "b": 254.47400000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.903, "t": 237.70500000000004, "r": 248.667, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 264.744, "t": 237.70500000000004, "r": 285.731, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 302.444, "t": 237.70500000000004, "r": 323.431, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 337.815, "t": 239.91999999999996, "r": 361.976, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 380.464, "t": 239.91999999999996, "r": 404.625, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 435.493, "t": 239.91999999999996, "r": 454.35, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false}]}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 7, "page_no": 9, "cluster": {"id": 7, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 143.979, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8309906721115112, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "10"}, {"label": "page_header", "id": 6, "page_no": 9, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 167.821, "t": 91.49300000000005, "r": 231.72, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8367075324058533, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}, {"label": "caption", "id": 4, "page_no": 9, "cluster": {"id": 4, "label": "caption", "bbox": {"l": 134.765, "t": 113.62099999999998, "r": 480.594, "b": 146.82799999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9512290954589844, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 123.76199999999994, "r_x1": 173.094, "r_y1": 123.76199999999994, "r_x2": 173.094, "r_y2": 115.83600000000001, "r_x3": 134.765, "r_y3": 115.83600000000001, "coord_origin": "TOPLEFT"}, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.303, "r_y0": 124.90999999999997, "r_x1": 480.592, "r_y1": 124.90999999999997, "r_x2": 480.592, "r_y2": 113.62099999999998, "r_x3": 181.303, "r_y3": 113.62099999999998, "coord_origin": "TOPLEFT"}, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 135.86900000000003, "r_x1": 480.594, "r_y1": 135.86900000000003, "r_x2": 480.594, "r_y2": 124.58000000000004, "r_x3": 134.765, "r_y3": 124.58000000000004, "coord_origin": "TOPLEFT"}, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 146.82799999999997, "r_x1": 305.957, "r_y1": 146.82799999999997, "r_x2": 305.957, "r_y2": 135.539, "r_x3": 134.765, "r_y3": 135.539, "coord_origin": "TOPLEFT"}, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 2. TSR and cell detection results compared between OTSL and HTML on the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using TableFormer [9] (with enc=6, dec=6, heads=8)."}, {"label": "table", "id": 0, "page_no": 9, "cluster": {"id": 0, "label": "table", "bbox": {"l": 143.6376495361328, "t": 156.3477020263672, "r": 470.8485412597656, "b": 263.2624816894531, "coord_origin": "TOPLEFT"}, "confidence": 0.9884640574455261, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.782, "r_y0": 175.57000000000005, "r_x1": 194.998, "r_y1": 175.57000000000005, "r_x2": 194.998, "r_y2": 164.28099999999995, "r_x3": 160.782, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.525, "r_y0": 175.54499999999996, "r_x1": 254.045, "r_y1": 175.54499999999996, "r_x2": 254.045, "r_y2": 164.25599999999997, "r_x3": 215.525, "r_y3": 164.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.397, "r_y0": 170.09000000000003, "r_x1": 323.991, "r_y1": 170.09000000000003, "r_x2": 323.991, "r_y2": 158.80100000000004, "r_x3": 300.397, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.345, "r_y0": 175.57000000000005, "r_x1": 414.747, "r_y1": 175.57000000000005, "r_x2": 414.747, "r_y2": 164.28099999999995, "r_x3": 370.345, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.737, "r_y0": 170.09000000000003, "r_x1": 463.108, "r_y1": 170.09000000000003, "r_x2": 463.108, "r_y2": 158.80100000000004, "r_x3": 426.737, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.114, "r_y0": 181.04899999999998, "r_x1": 466.727, "r_y1": 181.04899999999998, "r_x2": 466.727, "r_y2": 169.76, "r_x3": 423.114, "r_y3": 169.76, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.413, "r_y0": 183.04200000000003, "r_x1": 288.06, "r_y1": 183.04200000000003, "r_x2": 288.06, "r_y2": 171.75300000000004, "r_x3": 262.413, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.429, "r_y0": 183.04200000000003, "r_x1": 329.447, "r_y1": 183.04200000000003, "r_x2": 329.447, "r_y2": 171.75300000000004, "r_x3": 296.429, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.033, "r_y0": 183.04200000000003, "r_x1": 354.758, "r_y1": 183.04200000000003, "r_x2": 354.758, "r_y2": 171.75300000000004, "r_x3": 345.033, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.538, "r_y0": 201.87099999999998, "r_x1": 201.241, "r_y1": 201.87099999999998, "r_x2": 201.241, "r_y2": 190.582, "r_x3": 154.538, "r_y3": 190.582, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 196.39200000000005, "r_x1": 247.132, "r_y1": 196.39200000000005, "r_x2": 247.132, "r_y2": 185.10299999999995, "r_x3": 222.437, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 196.39200000000005, "r_x1": 285.731, "r_y1": 196.39200000000005, "r_x2": 285.731, "r_y2": 185.10299999999995, "r_x3": 264.744, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 196.39200000000005, "r_x1": 323.431, "r_y1": 196.39200000000005, "r_x2": 323.431, "r_y2": 185.10299999999995, "r_x3": 302.444, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 196.39200000000005, "r_x1": 360.39, "r_y1": 196.39200000000005, "r_x2": 360.39, "r_y2": 185.10299999999995, "r_x3": 339.403, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.116, "r_y0": 195.24400000000003, "r_x1": 401.973, "r_y1": 195.24400000000003, "r_x2": 401.973, "r_y2": 187.31799999999998, "r_x3": 383.116, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 195.24400000000003, "r_x1": 454.35, "r_y1": 195.24400000000003, "r_x2": 454.35, "r_y2": 187.31799999999998, "r_x3": 435.493, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 209.34299999999996, "r_x1": 248.667, "r_y1": 209.34299999999996, "r_x2": 248.667, "r_y2": 198.05399999999997, "r_x3": 220.903, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 209.34299999999996, "r_x1": 285.731, "r_y1": 209.34299999999996, "r_x2": 285.731, "r_y2": 198.05399999999997, "r_x3": 264.744, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 209.34299999999996, "r_x1": 323.431, "r_y1": 209.34299999999996, "r_x2": 323.431, "r_y2": 198.05399999999997, "r_x3": 302.444, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 209.34299999999996, "r_x1": 360.39, "r_y1": 209.34299999999996, "r_x2": 360.39, "r_y2": 198.05399999999997, "r_x3": 339.403, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 209.34299999999996, "r_x1": 403.039, "r_y1": 209.34299999999996, "r_x2": 403.039, "r_y2": 198.05399999999997, "r_x3": 382.052, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 209.34299999999996, "r_x1": 453.112, "r_y1": 209.34299999999996, "r_x2": 453.112, "r_y2": 198.05399999999997, "r_x3": 436.732, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.945, "r_y0": 228.173, "r_x1": 199.834, "r_y1": 228.173, "r_x2": 199.834, "r_y2": 216.88400000000001, "r_x3": 155.945, "r_y3": 216.88400000000001, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 222.69299999999998, "r_x1": 247.132, "r_y1": 222.69299999999998, "r_x2": 247.132, "r_y2": 211.404, "r_x3": 222.437, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 222.69299999999998, "r_x1": 285.731, "r_y1": 222.69299999999998, "r_x2": 285.731, "r_y2": 211.404, "r_x3": 264.744, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 222.69299999999998, "r_x1": 323.431, "r_y1": 222.69299999999998, "r_x2": 323.431, "r_y2": 211.404, "r_x3": 302.444, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 221.54499999999996, "r_x1": 361.976, "r_y1": 221.54499999999996, "r_x2": 361.976, "r_y2": 213.61900000000003, "r_x3": 337.815, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 221.54499999999996, "r_x1": 404.625, "r_y1": 221.54499999999996, "r_x2": 404.625, "r_y2": 213.61900000000003, "r_x3": 380.464, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 221.54499999999996, "r_x1": 454.35, "r_y1": 221.54499999999996, "r_x2": 454.35, "r_y2": 213.61900000000003, "r_x3": 435.493, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 235.64499999999998, "r_x1": 248.667, "r_y1": 235.64499999999998, "r_x2": 248.667, "r_y2": 224.356, "r_x3": 220.903, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 235.64499999999998, "r_x1": 285.731, "r_y1": 235.64499999999998, "r_x2": 285.731, "r_y2": 224.356, "r_x3": 264.744, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 235.64499999999998, "r_x1": 323.431, "r_y1": 235.64499999999998, "r_x2": 323.431, "r_y2": 224.356, "r_x3": 302.444, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.706, "r_y0": 235.64499999999998, "r_x1": 358.086, "r_y1": 235.64499999999998, "r_x2": 358.086, "r_y2": 224.356, "r_x3": 341.706, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 235.64499999999998, "r_x1": 403.039, "r_y1": 235.64499999999998, "r_x2": 403.039, "r_y2": 224.356, "r_x3": 382.052, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 235.64499999999998, "r_x1": 453.112, "r_y1": 235.64499999999998, "r_x2": 453.112, "r_y2": 224.356, "r_x3": 436.732, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.626, "r_y0": 254.47400000000005, "r_x1": 207.152, "r_y1": 254.47400000000005, "r_x2": 207.152, "r_y2": 243.18499999999995, "r_x3": 148.626, "r_y3": 243.18499999999995, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 248.99400000000003, "r_x1": 247.132, "r_y1": 248.99400000000003, "r_x2": 247.132, "r_y2": 237.70500000000004, "r_x3": 222.437, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 248.99400000000003, "r_x1": 285.731, "r_y1": 248.99400000000003, "r_x2": 285.731, "r_y2": 237.70500000000004, "r_x3": 264.744, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 248.99400000000003, "r_x1": 323.431, "r_y1": 248.99400000000003, "r_x2": 323.431, "r_y2": 237.70500000000004, "r_x3": 302.444, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 247.846, "r_x1": 361.976, "r_y1": 247.846, "r_x2": 361.976, "r_y2": 239.91999999999996, "r_x3": 337.815, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 247.846, "r_x1": 404.625, "r_y1": 247.846, "r_x2": 404.625, "r_y2": 239.91999999999996, "r_x3": 380.464, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 247.846, "r_x1": 454.35, "r_y1": 247.846, "r_x2": 454.35, "r_y2": 239.91999999999996, "r_x3": 435.493, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 261.946, "r_x1": 248.667, "r_y1": 261.946, "r_x2": 248.667, "r_y2": 250.65700000000004, "r_x3": 220.903, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 261.946, "r_x1": 285.731, "r_y1": 261.946, "r_x2": 285.731, "r_y2": 250.65700000000004, "r_x3": 264.744, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 261.946, "r_x1": 323.431, "r_y1": 261.946, "r_x2": 323.431, "r_y2": 250.65700000000004, "r_x3": 302.444, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 261.946, "r_x1": 360.39, "r_y1": 261.946, "r_x2": 360.39, "r_y2": 250.65700000000004, "r_x3": 339.403, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 261.946, "r_x1": 403.039, "r_y1": 261.946, "r_x2": 403.039, "r_y2": 250.65700000000004, "r_x3": 382.052, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 261.946, "r_x1": 453.112, "r_y1": 261.946, "r_x2": 453.112, "r_y2": 250.65700000000004, "r_x3": 436.732, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 10, "label": "text", "bbox": {"l": 160.782, "t": 164.28099999999995, "r": 194.998, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.782, "r_y0": 175.57000000000005, "r_x1": 194.998, "r_y1": 175.57000000000005, "r_x2": 194.998, "r_y2": 164.28099999999995, "r_x3": 160.782, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 215.525, "t": 164.25599999999997, "r": 254.045, "b": 175.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.525, "r_y0": 175.54499999999996, "r_x1": 254.045, "r_y1": 175.54499999999996, "r_x2": 254.045, "r_y2": 164.25599999999997, "r_x3": 215.525, "r_y3": 164.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 300.397, "t": 158.80100000000004, "r": 323.991, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.397, "r_y0": 170.09000000000003, "r_x1": 323.991, "r_y1": 170.09000000000003, "r_x2": 323.991, "r_y2": 158.80100000000004, "r_x3": 300.397, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 370.345, "t": 164.28099999999995, "r": 414.747, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.345, "r_y0": 175.57000000000005, "r_x1": 414.747, "r_y1": 175.57000000000005, "r_x2": 414.747, "r_y2": 164.28099999999995, "r_x3": 370.345, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 426.737, "t": 158.80100000000004, "r": 463.108, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.737, "r_y0": 170.09000000000003, "r_x1": 463.108, "r_y1": 170.09000000000003, "r_x2": 463.108, "r_y2": 158.80100000000004, "r_x3": 426.737, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 423.114, "t": 169.76, "r": 466.727, "b": 181.04899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.114, "r_y0": 181.04899999999998, "r_x1": 466.727, "r_y1": 181.04899999999998, "r_x2": 466.727, "r_y2": 169.76, "r_x3": 423.114, "r_y3": 169.76, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 262.413, "t": 171.75300000000004, "r": 288.06, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.413, "r_y0": 183.04200000000003, "r_x1": 288.06, "r_y1": 183.04200000000003, "r_x2": 288.06, "r_y2": 171.75300000000004, "r_x3": 262.413, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 296.429, "t": 171.75300000000004, "r": 329.447, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.429, "r_y0": 183.04200000000003, "r_x1": 329.447, "r_y1": 183.04200000000003, "r_x2": 329.447, "r_y2": 171.75300000000004, "r_x3": 296.429, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 345.033, "t": 171.75300000000004, "r": 354.758, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.033, "r_y0": 183.04200000000003, "r_x1": 354.758, "r_y1": 183.04200000000003, "r_x2": 354.758, "r_y2": 171.75300000000004, "r_x3": 345.033, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 154.538, "t": 190.582, "r": 201.241, "b": 201.87099999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.538, "r_y0": 201.87099999999998, "r_x1": 201.241, "r_y1": 201.87099999999998, "r_x2": 201.241, "r_y2": 190.582, "r_x3": 154.538, "r_y3": 190.582, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 222.437, "t": 185.10299999999995, "r": 247.132, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 196.39200000000005, "r_x1": 247.132, "r_y1": 196.39200000000005, "r_x2": 247.132, "r_y2": 185.10299999999995, "r_x3": 222.437, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 264.744, "t": 185.10299999999995, "r": 285.731, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 196.39200000000005, "r_x1": 285.731, "r_y1": 196.39200000000005, "r_x2": 285.731, "r_y2": 185.10299999999995, "r_x3": 264.744, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 302.444, "t": 185.10299999999995, "r": 323.431, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 196.39200000000005, "r_x1": 323.431, "r_y1": 196.39200000000005, "r_x2": 323.431, "r_y2": 185.10299999999995, "r_x3": 302.444, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 339.403, "t": 185.10299999999995, "r": 360.39, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 196.39200000000005, "r_x1": 360.39, "r_y1": 196.39200000000005, "r_x2": 360.39, "r_y2": 185.10299999999995, "r_x3": 339.403, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 383.116, "t": 187.31799999999998, "r": 401.973, "b": 195.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.116, "r_y0": 195.24400000000003, "r_x1": 401.973, "r_y1": 195.24400000000003, "r_x2": 401.973, "r_y2": 187.31799999999998, "r_x3": 383.116, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 435.493, "t": 187.31799999999998, "r": 454.35, "b": 195.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 195.24400000000003, "r_x1": 454.35, "r_y1": 195.24400000000003, "r_x2": 454.35, "r_y2": 187.31799999999998, "r_x3": 435.493, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 220.903, "t": 198.05399999999997, "r": 248.667, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 209.34299999999996, "r_x1": 248.667, "r_y1": 209.34299999999996, "r_x2": 248.667, "r_y2": 198.05399999999997, "r_x3": 220.903, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 264.744, "t": 198.05399999999997, "r": 285.731, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 209.34299999999996, "r_x1": 285.731, "r_y1": 209.34299999999996, "r_x2": 285.731, "r_y2": 198.05399999999997, "r_x3": 264.744, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 302.444, "t": 198.05399999999997, "r": 323.431, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 209.34299999999996, "r_x1": 323.431, "r_y1": 209.34299999999996, "r_x2": 323.431, "r_y2": 198.05399999999997, "r_x3": 302.444, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 339.403, "t": 198.05399999999997, "r": 360.39, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 209.34299999999996, "r_x1": 360.39, "r_y1": 209.34299999999996, "r_x2": 360.39, "r_y2": 198.05399999999997, "r_x3": 339.403, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 382.052, "t": 198.05399999999997, "r": 403.039, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 209.34299999999996, "r_x1": 403.039, "r_y1": 209.34299999999996, "r_x2": 403.039, "r_y2": 198.05399999999997, "r_x3": 382.052, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 436.732, "t": 198.05399999999997, "r": 453.112, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 209.34299999999996, "r_x1": 453.112, "r_y1": 209.34299999999996, "r_x2": 453.112, "r_y2": 198.05399999999997, "r_x3": 436.732, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 155.945, "t": 216.88400000000001, "r": 199.834, "b": 228.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.945, "r_y0": 228.173, "r_x1": 199.834, "r_y1": 228.173, "r_x2": 199.834, "r_y2": 216.88400000000001, "r_x3": 155.945, "r_y3": 216.88400000000001, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 222.437, "t": 211.404, "r": 247.132, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 222.69299999999998, "r_x1": 247.132, "r_y1": 222.69299999999998, "r_x2": 247.132, "r_y2": 211.404, "r_x3": 222.437, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 264.744, "t": 211.404, "r": 285.731, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 222.69299999999998, "r_x1": 285.731, "r_y1": 222.69299999999998, "r_x2": 285.731, "r_y2": 211.404, "r_x3": 264.744, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 302.444, "t": 211.404, "r": 323.431, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 222.69299999999998, "r_x1": 323.431, "r_y1": 222.69299999999998, "r_x2": 323.431, "r_y2": 211.404, "r_x3": 302.444, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 337.815, "t": 213.61900000000003, "r": 361.976, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 221.54499999999996, "r_x1": 361.976, "r_y1": 221.54499999999996, "r_x2": 361.976, "r_y2": 213.61900000000003, "r_x3": 337.815, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 380.464, "t": 213.61900000000003, "r": 404.625, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 221.54499999999996, "r_x1": 404.625, "r_y1": 221.54499999999996, "r_x2": 404.625, "r_y2": 213.61900000000003, "r_x3": 380.464, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 435.493, "t": 213.61900000000003, "r": 454.35, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 221.54499999999996, "r_x1": 454.35, "r_y1": 221.54499999999996, "r_x2": 454.35, "r_y2": 213.61900000000003, "r_x3": 435.493, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 220.903, "t": 224.356, "r": 248.667, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 235.64499999999998, "r_x1": 248.667, "r_y1": 235.64499999999998, "r_x2": 248.667, "r_y2": 224.356, "r_x3": 220.903, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 264.744, "t": 224.356, "r": 285.731, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 235.64499999999998, "r_x1": 285.731, "r_y1": 235.64499999999998, "r_x2": 285.731, "r_y2": 224.356, "r_x3": 264.744, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 302.444, "t": 224.356, "r": 323.431, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 235.64499999999998, "r_x1": 323.431, "r_y1": 235.64499999999998, "r_x2": 323.431, "r_y2": 224.356, "r_x3": 302.444, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 341.706, "t": 224.356, "r": 358.086, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.706, "r_y0": 235.64499999999998, "r_x1": 358.086, "r_y1": 235.64499999999998, "r_x2": 358.086, "r_y2": 224.356, "r_x3": 341.706, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 382.052, "t": 224.356, "r": 403.039, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 235.64499999999998, "r_x1": 403.039, "r_y1": 235.64499999999998, "r_x2": 403.039, "r_y2": 224.356, "r_x3": 382.052, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 436.732, "t": 224.356, "r": 453.112, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 235.64499999999998, "r_x1": 453.112, "r_y1": 235.64499999999998, "r_x2": 453.112, "r_y2": 224.356, "r_x3": 436.732, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 148.626, "t": 243.18499999999995, "r": 207.152, "b": 254.47400000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.626, "r_y0": 254.47400000000005, "r_x1": 207.152, "r_y1": 254.47400000000005, "r_x2": 207.152, "r_y2": 243.18499999999995, "r_x3": 148.626, "r_y3": 243.18499999999995, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 222.437, "t": 237.70500000000004, "r": 247.132, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 248.99400000000003, "r_x1": 247.132, "r_y1": 248.99400000000003, "r_x2": 247.132, "r_y2": 237.70500000000004, "r_x3": 222.437, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 264.744, "t": 237.70500000000004, "r": 285.731, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 248.99400000000003, "r_x1": 285.731, "r_y1": 248.99400000000003, "r_x2": 285.731, "r_y2": 237.70500000000004, "r_x3": 264.744, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 302.444, "t": 237.70500000000004, "r": 323.431, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 248.99400000000003, "r_x1": 323.431, "r_y1": 248.99400000000003, "r_x2": 323.431, "r_y2": 237.70500000000004, "r_x3": 302.444, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 337.815, "t": 239.91999999999996, "r": 361.976, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 247.846, "r_x1": 361.976, "r_y1": 247.846, "r_x2": 361.976, "r_y2": 239.91999999999996, "r_x3": 337.815, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 380.464, "t": 239.91999999999996, "r": 404.625, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 247.846, "r_x1": 404.625, "r_y1": 247.846, "r_x2": 404.625, "r_y2": 239.91999999999996, "r_x3": 380.464, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 435.493, "t": 239.91999999999996, "r": 454.35, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 247.846, "r_x1": 454.35, "r_y1": 247.846, "r_x2": 454.35, "r_y2": 239.91999999999996, "r_x3": 435.493, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 220.903, "t": 250.65700000000004, "r": 248.667, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 261.946, "r_x1": 248.667, "r_y1": 261.946, "r_x2": 248.667, "r_y2": 250.65700000000004, "r_x3": 220.903, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 264.744, "t": 250.65700000000004, "r": 285.731, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 261.946, "r_x1": 285.731, "r_y1": 261.946, "r_x2": 285.731, "r_y2": 250.65700000000004, "r_x3": 264.744, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 302.444, "t": 250.65700000000004, "r": 323.431, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 261.946, "r_x1": 323.431, "r_y1": 261.946, "r_x2": 323.431, "r_y2": 250.65700000000004, "r_x3": 302.444, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 339.403, "t": 250.65700000000004, "r": 360.39, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 261.946, "r_x1": 360.39, "r_y1": 261.946, "r_x2": 360.39, "r_y2": 250.65700000000004, "r_x3": 339.403, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 382.052, "t": 250.65700000000004, "r": 403.039, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 261.946, "r_x1": 403.039, "r_y1": 261.946, "r_x2": 403.039, "r_y2": 250.65700000000004, "r_x3": 382.052, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 436.732, "t": 250.65700000000004, "r": 453.112, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 261.946, "r_x1": 453.112, "r_y1": 261.946, "r_x2": 453.112, "r_y2": 250.65700000000004, "r_x3": 436.732, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 5, "num_cols": 7, "table_cells": [{"bbox": {"l": 160.782, "t": 164.28099999999995, "r": 194.998, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 215.525, "t": 164.25599999999997, "r": 254.045, "b": 175.54499999999996, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 300.397, "t": 158.80100000000004, "r": 323.991, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 370.345, "t": 164.28099999999995, "r": 414.747, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 423.114, "t": 158.80100000000004, "r": 466.727, "b": 181.04899999999998, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 262.413, "t": 171.75300000000004, "r": 288.06, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 296.429, "t": 171.75300000000004, "r": 329.447, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 345.033, "t": 171.75300000000004, "r": 354.758, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 154.538, "t": 190.582, "r": 201.241, "b": 201.87099999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.903, "t": 185.10299999999995, "r": 248.667, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 264.744, "t": 185.10299999999995, "r": 285.731, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 302.444, "t": 185.10299999999995, "r": 323.431, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 339.403, "t": 185.10299999999995, "r": 360.39, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 382.052, "t": 187.31799999999998, "r": 403.039, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 435.493, "t": 187.31799999999998, "r": 454.35, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 155.945, "t": 216.88400000000001, "r": 199.834, "b": 228.173, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.903, "t": 211.404, "r": 248.667, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 264.744, "t": 211.404, "r": 285.731, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 302.444, "t": 211.404, "r": 323.431, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 337.815, "t": 213.61900000000003, "r": 361.976, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 380.464, "t": 213.61900000000003, "r": 404.625, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 435.493, "t": 213.61900000000003, "r": 454.35, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 148.626, "t": 243.18499999999995, "r": 207.152, "b": 254.47400000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.903, "t": 237.70500000000004, "r": 248.667, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 264.744, "t": 237.70500000000004, "r": 285.731, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 302.444, "t": 237.70500000000004, "r": 323.431, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 337.815, "t": 239.91999999999996, "r": 361.976, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 380.464, "t": 239.91999999999996, "r": 404.625, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 435.493, "t": 239.91999999999996, "r": 454.35, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "section_header", "id": 3, "page_no": 9, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 288.915, "r": 257.087, "b": 297.722, "coord_origin": "TOPLEFT"}, "confidence": 0.9546447992324829, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 297.722, "r_x1": 149.402, "r_y1": 297.722, "r_x2": 149.402, "r_y2": 288.915, "r_x3": 134.765, "r_y3": 288.915, "coord_origin": "TOPLEFT"}, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 297.722, "r_x1": 257.087, "r_y1": 297.722, "r_x2": 257.087, "r_y2": 288.915, "r_x3": 160.859, "r_y3": 288.915, "coord_origin": "TOPLEFT"}, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.3 Qualitative Results"}, {"label": "text", "id": 1, "page_no": 9, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 309.861, "r": 480.59, "b": 366.478, "coord_origin": "TOPLEFT"}, "confidence": 0.9834085702896118, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 318.658, "r_x1": 189.59, "r_y1": 318.658, "r_x2": 189.59, "r_y2": 309.861, "r_x3": 134.765, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "To illustrate", "orig": "To illustrate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.263, "r_y0": 318.658, "r_x1": 208.096, "r_y1": 318.658, "r_x2": 208.096, "r_y2": 309.861, "r_x3": 194.263, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.768, "r_y0": 318.658, "r_x1": 258.971, "r_y1": 318.658, "r_x2": 258.971, "r_y2": 309.861, "r_x3": 212.768, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "qualitative", "orig": "qualitative", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.643, "r_y0": 318.658, "r_x1": 308.822, "r_y1": 318.658, "r_x2": 308.822, "r_y2": 309.861, "r_x3": 263.643, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "differences", "orig": "differences", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.484, "r_y0": 318.658, "r_x1": 480.588, "r_y1": 318.658, "r_x2": 480.588, "r_y2": 309.861, "r_x3": 313.484, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "between OTSL and HTML, Figure 5", "orig": "between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 330.613, "r_x1": 480.589, "r_y1": 330.613, "r_x2": 480.589, "r_y2": 321.816, "r_x3": 134.765, "r_y3": 321.816, "coord_origin": "TOPLEFT"}, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 342.568, "r_x1": 480.587, "r_y1": 342.568, "r_x2": 480.587, "r_y2": 333.771, "r_x3": 134.765, "r_y3": 333.771, "coord_origin": "TOPLEFT"}, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 354.523, "r_x1": 480.59, "r_y1": 354.523, "r_x2": 480.59, "r_y2": 345.726, "r_x3": 134.765, "r_y3": 345.726, "coord_origin": "TOPLEFT"}, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 366.478, "r_x1": 161.657, "r_y1": 366.478, "r_x2": 161.657, "r_y2": 357.681, "r_x3": 134.765, "r_y3": 357.681, "coord_origin": "TOPLEFT"}, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5 demonstrates less overlap and more accurate bounding boxes with OTSL. In Figure 6, OTSL proves to be more effective in handling tables with longer token sequences, resulting in even more precise structure prediction and bounding boxes."}, {"label": "caption", "id": 5, "page_no": 9, "cluster": {"id": 5, "label": "caption", "bbox": {"l": 134.765, "t": 395.375, "r": 480.591, "b": 439.717, "coord_origin": "TOPLEFT"}, "confidence": 0.9482728838920593, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 405.516, "r_x1": 162.644, "r_y1": 405.516, "r_x2": 162.644, "r_y2": 397.59, "r_x3": 134.765, "r_y3": 397.59, "coord_origin": "TOPLEFT"}, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.384, "r_y0": 406.664, "r_x1": 437.456, "r_y1": 406.664, "r_x2": 437.456, "r_y2": 395.375, "r_x3": 167.384, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "The OTSL model produces more accurate bounding boxes with", "orig": "The OTSL model produces more accurate bounding boxes with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.2, "r_y0": 406.664, "r_x1": 456.125, "r_y1": 406.664, "r_x2": 456.125, "r_y2": 395.375, "r_x3": 442.2, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "less", "orig": "less", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.86, "r_y0": 406.664, "r_x1": 480.591, "r_y1": 406.664, "r_x2": 480.591, "r_y2": 395.375, "r_x3": 460.86, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "over-", "orig": "over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 417.623, "r_x1": 147.049, "r_y1": 417.623, "r_x2": 147.049, "r_y2": 406.334, "r_x3": 134.765, "r_y3": 406.334, "coord_origin": "TOPLEFT"}, "text": "lap", "orig": "lap", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.434, "r_y0": 417.623, "r_x1": 480.591, "r_y1": 417.623, "r_x2": 480.591, "r_y2": 406.334, "r_x3": 151.434, "r_y3": 406.334, "coord_origin": "TOPLEFT"}, "text": "(E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "(E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 428.582, "r_x1": 146.541, "r_y1": 428.582, "r_x2": 146.541, "r_y2": 417.293, "r_x3": 134.765, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "ble", "orig": "ble", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.391, "r_y0": 428.582, "r_x1": 168.025, "r_y1": 428.582, "r_x2": 168.025, "r_y2": 417.293, "r_x3": 151.391, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "(A),", "orig": "(A),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.885, "r_y0": 428.582, "r_x1": 181.066, "r_y1": 428.582, "r_x2": 181.066, "r_y2": 417.293, "r_x3": 172.885, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "at", "orig": "at", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.925, "r_y0": 428.582, "r_x1": 206.655, "r_y1": 428.582, "r_x2": 206.655, "r_y2": 417.293, "r_x3": 185.925, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "twice", "orig": "twice", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.506, "r_y0": 428.582, "r_x1": 224.305, "r_y1": 428.582, "r_x2": 224.305, "r_y2": 417.293, "r_x3": 211.506, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.165, "r_y0": 428.582, "r_x1": 264.77, "r_y1": 428.582, "r_x2": 264.77, "r_y2": 417.293, "r_x3": 229.165, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "inference", "orig": "inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.621, "r_y0": 428.582, "r_x1": 291.939, "r_y1": 428.582, "r_x2": 291.939, "r_y2": 417.293, "r_x3": 269.621, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "speed", "orig": "speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.799, "r_y0": 428.582, "r_x1": 327.819, "r_y1": 428.582, "r_x2": 327.819, "r_y2": 417.293, "r_x3": 296.799, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "because", "orig": "because", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.67, "r_y0": 428.582, "r_x1": 340.092, "r_y1": 428.582, "r_x2": 340.092, "r_y2": 417.293, "r_x3": 332.67, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.952, "r_y0": 428.582, "r_x1": 373.2, "r_y1": 428.582, "r_x2": 373.2, "r_y2": 417.293, "r_x3": 344.952, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "shorter", "orig": "shorter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.05, "r_y0": 428.582, "r_x1": 413.174, "r_y1": 428.582, "r_x2": 413.174, "r_y2": 417.293, "r_x3": 378.05, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "sequence", "orig": "sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.024, "r_y0": 428.582, "r_x1": 443.108, "r_y1": 428.582, "r_x2": 443.108, "r_y2": 417.293, "r_x3": 418.024, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "length", "orig": "length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.959, "r_y0": 428.582, "r_x1": 480.588, "r_y1": 428.582, "r_x2": 480.588, "r_y2": 417.293, "r_x3": 447.959, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "(B),(C).", "orig": "(B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.541, "r_x1": 304.692, "r_y1": 439.541, "r_x2": 304.692, "r_y2": 428.252, "r_x3": 134.765, "r_y3": 428.252, "coord_origin": "TOPLEFT"}, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 342.634, "r_y0": 439.717, "r_x1": 344.819, "r_y1": 439.717, "r_x2": 344.819, "r_y2": 430.197, "r_x3": 342.634, "r_y3": 430.197, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 5. The OTSL model produces more accurate bounding boxes with less overlap (E) than the HTML model (D), when predicting the structure of a sparse table (A), at twice the inference speed because of shorter sequence length (B),(C). \"PMC2807444_006_00.png\" PubTabNet. \u03bc"}, {"label": "picture", "id": 2, "page_no": 9, "cluster": {"id": 2, "label": "picture", "bbox": {"l": 162.67430114746094, "t": 444.62255859375, "r": 451.70062255859375, "b": 663.2135620117188, "coord_origin": "TOPLEFT"}, "confidence": 0.9742383360862732, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 518.934, "r_x1": 190.62, "r_y1": 518.934, "r_x2": 190.62, "r_y2": 516.296, "r_x3": 180.125, "r_y3": 516.296, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 522.8330000000001, "r_x1": 304.548, "r_y1": 522.8330000000001, "r_x2": 304.548, "r_y2": 520.194, "r_x3": 183.244, "r_y3": 520.194, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "orig": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 526.731, "r_x1": 388.423, "r_y1": 526.731, "r_x2": 388.423, "r_y2": 524.0930000000001, "r_x3": 183.244, "r_y3": 524.0930000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 530.63, "r_x1": 388.423, "r_y1": 530.63, "r_x2": 388.423, "r_y2": 527.992, "r_x3": 183.244, "r_y3": 527.992, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 534.529, "r_x1": 388.423, "r_y1": 534.529, "r_x2": 388.423, "r_y2": 531.8910000000001, "r_x3": 183.244, "r_y3": 531.8910000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 538.428, "r_x1": 388.423, "r_y1": 538.428, "r_x2": 388.423, "r_y2": 535.79, "r_x3": 183.244, "r_y3": 535.79, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 542.327, "r_x1": 388.423, "r_y1": 542.327, "r_x2": 388.423, "r_y2": 539.689, "r_x3": 183.244, "r_y3": 539.689, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 546.226, "r_x1": 388.423, "r_y1": 546.226, "r_x2": 388.423, "r_y2": 543.588, "r_x3": 183.244, "r_y3": 543.588, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 550.124, "r_x1": 388.423, "r_y1": 550.124, "r_x2": 388.423, "r_y2": 547.486, "r_x3": 183.244, "r_y3": 547.486, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 554.023, "r_x1": 388.423, "r_y1": 554.023, "r_x2": 388.423, "r_y2": 551.385, "r_x3": 183.244, "r_y3": 551.385, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 557.922, "r_x1": 191.868, "r_y1": 557.922, "r_x2": 191.868, "r_y2": 555.284, "r_x3": 180.125, "r_y3": 555.284, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 521.001, "r_x1": 450.486, "r_y1": 521.001, "r_x2": 450.486, "r_y2": 518.363, "r_x3": 407.383, "r_y3": 518.363, "coord_origin": "TOPLEFT"}, "text": "C C L L L C L L L L L C L L NL", "orig": "C C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 524.9, "r_x1": 450.486, "r_y1": 524.9, "r_x2": 450.486, "r_y2": 522.262, "r_x3": 407.383, "r_y3": 522.262, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 528.799, "r_x1": 450.486, "r_y1": 528.799, "r_x2": 450.486, "r_y2": 526.1600000000001, "r_x3": 407.383, "r_y3": 526.1600000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 532.697, "r_x1": 450.486, "r_y1": 532.697, "r_x2": 450.486, "r_y2": 530.059, "r_x3": 407.383, "r_y3": 530.059, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 536.596, "r_x1": 450.486, "r_y1": 536.596, "r_x2": 450.486, "r_y2": 533.9580000000001, "r_x3": 407.383, "r_y3": 533.9580000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 540.495, "r_x1": 450.486, "r_y1": 540.495, "r_x2": 450.486, "r_y2": 537.857, "r_x3": 407.383, "r_y3": 537.857, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 544.394, "r_x1": 450.486, "r_y1": 544.394, "r_x2": 450.486, "r_y2": 541.756, "r_x3": 407.383, "r_y3": 541.756, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 548.293, "r_x1": 450.486, "r_y1": 548.293, "r_x2": 450.486, "r_y2": 545.655, "r_x3": 407.383, "r_y3": 545.655, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 552.192, "r_x1": 450.486, "r_y1": 552.192, "r_x2": 450.486, "r_y2": 549.554, "r_x3": 407.383, "r_y3": 549.554, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.529, "r_y0": 515.288, "r_x1": 181.853, "r_y1": 515.288, "r_x2": 181.853, "r_y2": 509.533, "r_x3": 164.529, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.584, "r_y0": 515.288, "r_x1": 208.901, "r_y1": 515.288, "r_x2": 208.901, "r_y2": 509.533, "r_x3": 183.584, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 515.288, "r_x1": 221.04, "r_y1": 515.288, "r_x2": 221.04, "r_y2": 509.533, "r_x3": 210.633, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.202, "r_y0": 515.433, "r_x1": 406.836, "r_y1": 515.433, "r_x2": 406.836, "r_y2": 509.678, "r_x3": 390.202, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.569, "r_y0": 515.433, "r_x1": 433.886, "r_y1": 515.433, "r_x2": 433.886, "r_y2": 509.678, "r_x3": 408.569, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.617, "r_y0": 515.433, "r_x1": 446.025, "r_y1": 515.433, "r_x2": 446.025, "r_y2": 509.678, "r_x3": 435.617, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.193, "r_y0": 526.36, "r_x1": 172.823, "r_y1": 526.36, "r_x2": 172.823, "r_y2": 519.1659999999999, "r_x3": 167.193, "r_y3": 519.1659999999999, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.337, "r_y0": 455.912, "r_x1": 192.967, "r_y1": 455.912, "r_x2": 192.967, "r_y2": 448.718, "r_x3": 187.337, "r_y3": 448.718, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.387, "r_y0": 573.292, "r_x1": 173.016, "r_y1": 573.292, "r_x2": 173.016, "r_y2": 566.0989999999999, "r_x3": 167.387, "r_y3": 566.0989999999999, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.456, "r_y0": 629.067, "r_x1": 253.657, "r_y1": 629.067, "r_x2": 253.657, "r_y2": 621.874, "r_x3": 248.456, "r_y3": 621.874, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.901, "r_y0": 526.4870000000001, "r_x1": 401.531, "r_y1": 526.4870000000001, "r_x2": 401.531, "r_y2": 519.293, "r_x3": 395.901, "r_y3": 519.293, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.46, "r_y0": 597.268, "r_x1": 177.455, "r_y1": 580.287, "r_x2": 171.7, "r_y2": 580.289, "r_x3": 171.705, "r_y3": 597.269, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.891, "r_y0": 649.923, "r_x1": 256.886, "r_y1": 633.633, "r_x2": 251.131, "r_y2": 633.634, "r_x3": 251.136, "r_y3": 649.925, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 607.287, "r_x1": 427.038, "r_y1": 607.287, "r_x2": 427.038, "r_y2": 601.532, "r_x3": 372.146, "r_y3": 601.532, "coord_origin": "TOPLEFT"}, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 613.729, "r_x1": 430.068, "r_y1": 613.729, "r_x2": 430.068, "r_y2": 607.9739999999999, "r_x3": 372.146, "r_y3": 607.9739999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 648.702, "r_x1": 231.082, "r_y1": 648.702, "r_x2": 231.082, "r_y2": 642.947, "r_x3": 176.88, "r_y3": 642.947, "coord_origin": "TOPLEFT"}, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 655.144, "r_x1": 230.993, "r_y1": 655.144, "r_x2": 230.993, "r_y2": 649.389, "r_x3": 176.88, "r_y3": 649.389, "coord_origin": "TOPLEFT"}, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 661.586, "r_x1": 203.932, "r_y1": 661.586, "r_x2": 203.932, "r_y2": 655.831, "r_x3": 176.88, "r_y3": 655.831, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.932, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.563, "r_x3": 215.932, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.057, "r_y0": 569.16, "r_x1": 231.719, "r_y1": 569.16, "r_x2": 231.719, "r_y2": 557.563, "r_x3": 229.057, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.209, "r_y0": 451.197, "r_x1": 263.57, "r_y1": 451.197, "r_x2": 263.57, "r_y2": 448.461, "r_x3": 261.209, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.335, "r_y0": 451.197, "r_x1": 313.636, "r_y1": 451.197, "r_x2": 313.636, "r_y2": 448.461, "r_x3": 312.335, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.411, "r_y0": 451.197, "r_x1": 380.057, "r_y1": 451.197, "r_x2": 380.057, "r_y2": 448.461, "r_x3": 377.411, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 456.076, "r_x1": 205.818, "r_y1": 456.076, "r_x2": 205.818, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.208, "r_y0": 456.076, "r_x1": 229.761, "r_y1": 456.076, "r_x2": 229.761, "r_y2": 453.34, "r_x3": 222.208, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.267, "r_y0": 456.076, "r_x1": 250.82, "r_y1": 456.076, "r_x2": 250.82, "r_y2": 453.34, "r_x3": 243.267, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.297, "r_y0": 456.076, "r_x1": 271.842, "r_y1": 456.076, "r_x2": 271.842, "r_y2": 453.34, "r_x3": 264.297, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.319, "r_y0": 456.076, "r_x1": 292.872, "r_y1": 456.076, "r_x2": 292.872, "r_y2": 453.34, "r_x3": 285.319, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.378, "r_y0": 456.076, "r_x1": 311.766, "r_y1": 456.076, "r_x2": 311.766, "r_y2": 453.34, "r_x3": 306.378, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.417, "r_y0": 456.076, "r_x1": 325.575, "r_y1": 456.076, "r_x2": 325.575, "r_y2": 453.34, "r_x3": 323.417, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.458, "r_y0": 456.076, "r_x1": 336.616, "r_y1": 456.076, "r_x2": 336.616, "r_y2": 453.34, "r_x3": 334.458, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.528, "r_y0": 456.076, "r_x1": 347.685, "r_y1": 456.076, "r_x2": 347.685, "r_y2": 453.34, "r_x3": 345.528, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.569, "r_y0": 456.076, "r_x1": 358.726, "r_y1": 456.076, "r_x2": 358.726, "r_y2": 453.34, "r_x3": 356.569, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.638, "r_y0": 456.076, "r_x1": 371.964, "r_y1": 456.076, "r_x2": 371.964, "r_y2": 453.34, "r_x3": 367.638, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.673, "r_y0": 456.076, "r_x1": 386.999, "r_y1": 456.076, "r_x2": 386.999, "r_y2": 453.34, "r_x3": 382.673, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.737, "r_y0": 456.076, "r_x1": 402.063, "r_y1": 456.076, "r_x2": 402.063, "r_y2": 453.34, "r_x3": 397.737, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 457.8, "r_x1": 414.935, "r_y1": 457.8, "r_x2": 414.935, "r_y2": 447.993, "r_x3": 412.789, "r_y3": 447.993, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.07, "r_y0": 456.076, "r_x1": 422.535, "r_y1": 456.076, "r_x2": 422.535, "r_y2": 453.34, "r_x3": 416.07, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "128", "orig": "128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.563, "r_y1": 466.66, "r_x2": 204.563, "r_y2": 463.924, "r_x3": 200.64, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.924, "r_x3": 367.626, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 466.66, "r_x1": 384.616, "r_y1": 466.66, "r_x2": 384.616, "r_y2": 463.924, "r_x3": 382.661, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 466.66, "r_x1": 399.679, "r_y1": 466.66, "r_x2": 399.679, "r_y2": 463.924, "r_x3": 397.725, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 471.539, "r_x1": 206.503, "r_y1": 471.539, "r_x2": 206.503, "r_y2": 468.803, "r_x3": 200.64, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 471.539, "r_x1": 266.245, "r_y1": 471.539, "r_x2": 266.245, "r_y2": 468.803, "r_x3": 264.29, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.372, "r_y0": 471.539, "r_x1": 308.326, "r_y1": 471.539, "r_x2": 308.326, "r_y2": 468.803, "r_x3": 306.372, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.515, "r_y0": 471.539, "r_x1": 347.47, "r_y1": 471.539, "r_x2": 347.47, "r_y2": 468.803, "r_x3": 345.515, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.556, "r_y0": 471.539, "r_x1": 358.511, "r_y1": 471.539, "r_x2": 358.511, "r_y2": 468.803, "r_x3": 356.556, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 471.539, "r_x1": 369.58, "r_y1": 471.539, "r_x2": 369.58, "r_y2": 468.803, "r_x3": 367.626, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 471.539, "r_x1": 384.615, "r_y1": 471.539, "r_x2": 384.615, "r_y2": 468.803, "r_x3": 382.661, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 476.418, "r_x1": 206.503, "r_y1": 476.418, "r_x2": 206.503, "r_y2": 473.682, "r_x3": 200.64, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 476.418, "r_x1": 266.245, "r_y1": 476.418, "r_x2": 266.245, "r_y2": 473.682, "r_x3": 264.29, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 481.268, "r_x1": 206.503, "r_y1": 481.268, "r_x2": 206.503, "r_y2": 478.532, "r_x3": 200.64, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.264, "r_y0": 481.268, "r_x1": 245.218, "r_y1": 481.268, "r_x2": 245.218, "r_y2": 478.532, "r_x3": 243.264, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 481.268, "r_x1": 266.245, "r_y1": 481.268, "r_x2": 266.245, "r_y2": 478.532, "r_x3": 264.29, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.405, "r_y0": 481.268, "r_x1": 325.359, "r_y1": 481.268, "r_x2": 325.359, "r_y2": 478.532, "r_x3": 323.405, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 481.268, "r_x1": 399.679, "r_y1": 481.268, "r_x2": 399.679, "r_y2": 478.532, "r_x3": 397.725, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 486.147, "r_x1": 206.503, "r_y1": 486.147, "r_x2": 206.503, "r_y2": 483.411, "r_x3": 200.64, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 486.147, "r_x1": 384.616, "r_y1": 486.147, "r_x2": 384.616, "r_y2": 483.411, "r_x3": 382.661, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 486.147, "r_x1": 401.648, "r_y1": 486.147, "r_x2": 401.648, "r_y2": 483.411, "r_x3": 397.725, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 486.147, "r_x1": 414.744, "r_y1": 486.147, "r_x2": 414.744, "r_y2": 483.411, "r_x3": 412.789, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 491.026, "r_x1": 207.134, "r_y1": 491.026, "r_x2": 207.134, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 491.026, "r_x1": 369.784, "r_y1": 491.026, "r_x2": 369.784, "r_y2": 488.29, "r_x3": 367.626, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 491.026, "r_x1": 384.819, "r_y1": 491.026, "r_x2": 384.819, "r_y2": 488.29, "r_x3": 382.661, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 491.026, "r_x1": 402.051, "r_y1": 491.026, "r_x2": 402.051, "r_y2": 488.29, "r_x3": 397.725, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 495.904, "r_x1": 208.472, "r_y1": 495.904, "r_x2": 208.472, "r_y2": 493.168, "r_x3": 200.64, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 495.904, "r_x1": 266.245, "r_y1": 495.904, "r_x2": 266.245, "r_y2": 493.168, "r_x3": 264.29, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 58, "label": "text", "bbox": {"l": 180.125, "t": 516.296, "r": 190.62, "b": 518.934, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 518.934, "r_x1": 190.62, "r_y1": 518.934, "r_x2": 190.62, "r_y2": 516.296, "r_x3": 180.125, "r_y3": 516.296, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 183.244, "t": 520.194, "r": 304.548, "b": 522.8330000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 522.8330000000001, "r_x1": 304.548, "r_y1": 522.8330000000001, "r_x2": 304.548, "r_y2": 520.194, "r_x3": 183.244, "r_y3": 520.194, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "orig": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 183.244, "t": 524.0930000000001, "r": 388.423, "b": 526.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 526.731, "r_x1": 388.423, "r_y1": 526.731, "r_x2": 388.423, "r_y2": 524.0930000000001, "r_x3": 183.244, "r_y3": 524.0930000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 183.244, "t": 527.992, "r": 388.423, "b": 530.63, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 530.63, "r_x1": 388.423, "r_y1": 530.63, "r_x2": 388.423, "r_y2": 527.992, "r_x3": 183.244, "r_y3": 527.992, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 183.244, "t": 531.8910000000001, "r": 388.423, "b": 534.529, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 534.529, "r_x1": 388.423, "r_y1": 534.529, "r_x2": 388.423, "r_y2": 531.8910000000001, "r_x3": 183.244, "r_y3": 531.8910000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 183.244, "t": 535.79, "r": 388.423, "b": 538.428, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 538.428, "r_x1": 388.423, "r_y1": 538.428, "r_x2": 388.423, "r_y2": 535.79, "r_x3": 183.244, "r_y3": 535.79, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 183.244, "t": 539.689, "r": 388.423, "b": 542.327, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 542.327, "r_x1": 388.423, "r_y1": 542.327, "r_x2": 388.423, "r_y2": 539.689, "r_x3": 183.244, "r_y3": 539.689, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 183.244, "t": 543.588, "r": 388.423, "b": 546.226, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 546.226, "r_x1": 388.423, "r_y1": 546.226, "r_x2": 388.423, "r_y2": 543.588, "r_x3": 183.244, "r_y3": 543.588, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 183.244, "t": 547.486, "r": 388.423, "b": 550.124, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 550.124, "r_x1": 388.423, "r_y1": 550.124, "r_x2": 388.423, "r_y2": 547.486, "r_x3": 183.244, "r_y3": 547.486, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 183.244, "t": 551.385, "r": 388.423, "b": 554.023, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 554.023, "r_x1": 388.423, "r_y1": 554.023, "r_x2": 388.423, "r_y2": 551.385, "r_x3": 183.244, "r_y3": 551.385, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 180.125, "t": 555.284, "r": 191.868, "b": 557.922, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 557.922, "r_x1": 191.868, "r_y1": 557.922, "r_x2": 191.868, "r_y2": 555.284, "r_x3": 180.125, "r_y3": 555.284, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 407.383, "t": 518.363, "r": 450.486, "b": 521.001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 521.001, "r_x1": 450.486, "r_y1": 521.001, "r_x2": 450.486, "r_y2": 518.363, "r_x3": 407.383, "r_y3": 518.363, "coord_origin": "TOPLEFT"}, "text": "C C L L L C L L L L L C L L NL", "orig": "C C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 407.383, "t": 522.262, "r": 450.486, "b": 524.9, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 524.9, "r_x1": 450.486, "r_y1": 524.9, "r_x2": 450.486, "r_y2": 522.262, "r_x3": 407.383, "r_y3": 522.262, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 407.383, "t": 526.1600000000001, "r": 450.486, "b": 528.799, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 528.799, "r_x1": 450.486, "r_y1": 528.799, "r_x2": 450.486, "r_y2": 526.1600000000001, "r_x3": 407.383, "r_y3": 526.1600000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 407.383, "t": 530.059, "r": 450.486, "b": 532.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 532.697, "r_x1": 450.486, "r_y1": 532.697, "r_x2": 450.486, "r_y2": 530.059, "r_x3": 407.383, "r_y3": 530.059, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 407.383, "t": 533.9580000000001, "r": 450.486, "b": 536.596, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 536.596, "r_x1": 450.486, "r_y1": 536.596, "r_x2": 450.486, "r_y2": 533.9580000000001, "r_x3": 407.383, "r_y3": 533.9580000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 407.383, "t": 537.857, "r": 450.486, "b": 540.495, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 540.495, "r_x1": 450.486, "r_y1": 540.495, "r_x2": 450.486, "r_y2": 537.857, "r_x3": 407.383, "r_y3": 537.857, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 407.383, "t": 541.756, "r": 450.486, "b": 544.394, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 544.394, "r_x1": 450.486, "r_y1": 544.394, "r_x2": 450.486, "r_y2": 541.756, "r_x3": 407.383, "r_y3": 541.756, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 407.383, "t": 545.655, "r": 450.486, "b": 548.293, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 548.293, "r_x1": 450.486, "r_y1": 548.293, "r_x2": 450.486, "r_y2": 545.655, "r_x3": 407.383, "r_y3": 545.655, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 407.383, "t": 549.554, "r": 450.486, "b": 552.192, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 552.192, "r_x1": 450.486, "r_y1": 552.192, "r_x2": 450.486, "r_y2": 549.554, "r_x3": 407.383, "r_y3": 549.554, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 164.529, "t": 509.533, "r": 181.853, "b": 515.288, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.529, "r_y0": 515.288, "r_x1": 181.853, "r_y1": 515.288, "r_x2": 181.853, "r_y2": 509.533, "r_x3": 164.529, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 183.584, "t": 509.533, "r": 208.901, "b": 515.288, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.584, "r_y0": 515.288, "r_x1": 208.901, "r_y1": 515.288, "r_x2": 208.901, "r_y2": 509.533, "r_x3": 183.584, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 210.633, "t": 509.533, "r": 221.04, "b": 515.288, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 515.288, "r_x1": 221.04, "r_y1": 515.288, "r_x2": 221.04, "r_y2": 509.533, "r_x3": 210.633, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 390.202, "t": 509.678, "r": 406.836, "b": 515.433, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.202, "r_y0": 515.433, "r_x1": 406.836, "r_y1": 515.433, "r_x2": 406.836, "r_y2": 509.678, "r_x3": 390.202, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 408.569, "t": 509.678, "r": 433.886, "b": 515.433, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.569, "r_y0": 515.433, "r_x1": 433.886, "r_y1": 515.433, "r_x2": 433.886, "r_y2": 509.678, "r_x3": 408.569, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 435.617, "t": 509.678, "r": 446.025, "b": 515.433, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.617, "r_y0": 515.433, "r_x1": 446.025, "r_y1": 515.433, "r_x2": 446.025, "r_y2": 509.678, "r_x3": 435.617, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 167.193, "t": 519.1659999999999, "r": 172.823, "b": 526.36, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.193, "r_y0": 526.36, "r_x1": 172.823, "r_y1": 526.36, "r_x2": 172.823, "r_y2": 519.1659999999999, "r_x3": 167.193, "r_y3": 519.1659999999999, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 187.337, "t": 448.718, "r": 192.967, "b": 455.912, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.337, "r_y0": 455.912, "r_x1": 192.967, "r_y1": 455.912, "r_x2": 192.967, "r_y2": 448.718, "r_x3": 187.337, "r_y3": 448.718, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 167.387, "t": 566.0989999999999, "r": 173.016, "b": 573.292, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.387, "r_y0": 573.292, "r_x1": 173.016, "r_y1": 573.292, "r_x2": 173.016, "r_y2": 566.0989999999999, "r_x3": 167.387, "r_y3": 566.0989999999999, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 248.456, "t": 621.874, "r": 253.657, "b": 629.067, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.456, "r_y0": 629.067, "r_x1": 253.657, "r_y1": 629.067, "r_x2": 253.657, "r_y2": 621.874, "r_x3": 248.456, "r_y3": 621.874, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 395.901, "t": 519.293, "r": 401.531, "b": 526.4870000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.901, "r_y0": 526.4870000000001, "r_x1": 401.531, "r_y1": 526.4870000000001, "r_x2": 401.531, "r_y2": 519.293, "r_x3": 395.901, "r_y3": 519.293, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 171.7, "t": 580.287, "r": 177.46, "b": 597.269, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.46, "r_y0": 597.268, "r_x1": 177.455, "r_y1": 580.287, "r_x2": 171.7, "r_y2": 580.289, "r_x3": 171.705, "r_y3": 597.269, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 251.131, "t": 633.633, "r": 256.891, "b": 649.925, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.891, "r_y0": 649.923, "r_x1": 256.886, "r_y1": 633.633, "r_x2": 251.131, "r_y2": 633.634, "r_x3": 251.136, "r_y3": 649.925, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 372.146, "t": 601.532, "r": 427.038, "b": 607.287, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 607.287, "r_x1": 427.038, "r_y1": 607.287, "r_x2": 427.038, "r_y2": 601.532, "r_x3": 372.146, "r_y3": 601.532, "coord_origin": "TOPLEFT"}, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 372.146, "t": 607.9739999999999, "r": 430.068, "b": 613.729, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 613.729, "r_x1": 430.068, "r_y1": 613.729, "r_x2": 430.068, "r_y2": 607.9739999999999, "r_x3": 372.146, "r_y3": 607.9739999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 176.88, "t": 642.947, "r": 231.082, "b": 648.702, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 648.702, "r_x1": 231.082, "r_y1": 648.702, "r_x2": 231.082, "r_y2": 642.947, "r_x3": 176.88, "r_y3": 642.947, "coord_origin": "TOPLEFT"}, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 176.88, "t": 649.389, "r": 230.993, "b": 655.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 655.144, "r_x1": 230.993, "r_y1": 655.144, "r_x2": 230.993, "r_y2": 649.389, "r_x3": 176.88, "r_y3": 649.389, "coord_origin": "TOPLEFT"}, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 176.88, "t": 655.831, "r": 203.932, "b": 661.586, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 661.586, "r_x1": 203.932, "r_y1": 661.586, "r_x2": 203.932, "r_y2": 655.831, "r_x3": 176.88, "r_y3": 655.831, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 215.932, "t": 557.563, "r": 218.47, "b": 569.16, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.932, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.563, "r_x3": 215.932, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 229.057, "t": 557.563, "r": 231.719, "b": 569.16, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.057, "r_y0": 569.16, "r_x1": 231.719, "r_y1": 569.16, "r_x2": 231.719, "r_y2": 557.563, "r_x3": 229.057, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 261.209, "t": 448.461, "r": 263.57, "b": 451.197, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.209, "r_y0": 451.197, "r_x1": 263.57, "r_y1": 451.197, "r_x2": 263.57, "r_y2": 448.461, "r_x3": 261.209, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 312.335, "t": 448.461, "r": 313.636, "b": 451.197, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.335, "r_y0": 451.197, "r_x1": 313.636, "r_y1": 451.197, "r_x2": 313.636, "r_y2": 448.461, "r_x3": 312.335, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 377.411, "t": 448.461, "r": 380.057, "b": 451.197, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.411, "r_y0": 451.197, "r_x1": 380.057, "r_y1": 451.197, "r_x2": 380.057, "r_y2": 448.461, "r_x3": 377.411, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 200.64, "t": 453.34, "r": 205.818, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 456.076, "r_x1": 205.818, "r_y1": 456.076, "r_x2": 205.818, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 222.208, "t": 453.34, "r": 229.761, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.208, "r_y0": 456.076, "r_x1": 229.761, "r_y1": 456.076, "r_x2": 229.761, "r_y2": 453.34, "r_x3": 222.208, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 243.267, "t": 453.34, "r": 250.82, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.267, "r_y0": 456.076, "r_x1": 250.82, "r_y1": 456.076, "r_x2": 250.82, "r_y2": 453.34, "r_x3": 243.267, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 264.297, "t": 453.34, "r": 271.842, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.297, "r_y0": 456.076, "r_x1": 271.842, "r_y1": 456.076, "r_x2": 271.842, "r_y2": 453.34, "r_x3": 264.297, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 285.319, "t": 453.34, "r": 292.872, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.319, "r_y0": 456.076, "r_x1": 292.872, "r_y1": 456.076, "r_x2": 292.872, "r_y2": 453.34, "r_x3": 285.319, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 306.378, "t": 453.34, "r": 311.766, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.378, "r_y0": 456.076, "r_x1": 311.766, "r_y1": 456.076, "r_x2": 311.766, "r_y2": 453.34, "r_x3": 306.378, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 323.417, "t": 453.34, "r": 325.575, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.417, "r_y0": 456.076, "r_x1": 325.575, "r_y1": 456.076, "r_x2": 325.575, "r_y2": 453.34, "r_x3": 323.417, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 334.458, "t": 453.34, "r": 336.616, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.458, "r_y0": 456.076, "r_x1": 336.616, "r_y1": 456.076, "r_x2": 336.616, "r_y2": 453.34, "r_x3": 334.458, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 345.528, "t": 453.34, "r": 347.685, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.528, "r_y0": 456.076, "r_x1": 347.685, "r_y1": 456.076, "r_x2": 347.685, "r_y2": 453.34, "r_x3": 345.528, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 356.569, "t": 453.34, "r": 358.726, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.569, "r_y0": 456.076, "r_x1": 358.726, "r_y1": 456.076, "r_x2": 358.726, "r_y2": 453.34, "r_x3": 356.569, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 367.638, "t": 453.34, "r": 371.964, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.638, "r_y0": 456.076, "r_x1": 371.964, "r_y1": 456.076, "r_x2": 371.964, "r_y2": 453.34, "r_x3": 367.638, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 382.673, "t": 453.34, "r": 386.999, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.673, "r_y0": 456.076, "r_x1": 386.999, "r_y1": 456.076, "r_x2": 386.999, "r_y2": 453.34, "r_x3": 382.673, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 397.737, "t": 453.34, "r": 402.063, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.737, "r_y0": 456.076, "r_x1": 402.063, "r_y1": 456.076, "r_x2": 402.063, "r_y2": 453.34, "r_x3": 397.737, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 412.789, "t": 447.993, "r": 414.935, "b": 457.8, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 457.8, "r_x1": 414.935, "r_y1": 457.8, "r_x2": 414.935, "r_y2": 447.993, "r_x3": 412.789, "r_y3": 447.993, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 416.07, "t": 453.34, "r": 422.535, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.07, "r_y0": 456.076, "r_x1": 422.535, "r_y1": 456.076, "r_x2": 422.535, "r_y2": 453.34, "r_x3": 416.07, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "128", "orig": "128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 200.64, "t": 463.924, "r": 204.563, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.563, "r_y1": 466.66, "r_x2": 204.563, "r_y2": 463.924, "r_x3": 200.64, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 367.626, "t": 463.924, "r": 369.58, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.924, "r_x3": 367.626, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 382.661, "t": 463.924, "r": 384.616, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 466.66, "r_x1": 384.616, "r_y1": 466.66, "r_x2": 384.616, "r_y2": 463.924, "r_x3": 382.661, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 397.725, "t": 463.924, "r": 399.679, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 466.66, "r_x1": 399.679, "r_y1": 466.66, "r_x2": 399.679, "r_y2": 463.924, "r_x3": 397.725, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 200.64, "t": 468.803, "r": 206.503, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 471.539, "r_x1": 206.503, "r_y1": 471.539, "r_x2": 206.503, "r_y2": 468.803, "r_x3": 200.64, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 264.29, "t": 468.803, "r": 266.245, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 471.539, "r_x1": 266.245, "r_y1": 471.539, "r_x2": 266.245, "r_y2": 468.803, "r_x3": 264.29, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 306.372, "t": 468.803, "r": 308.326, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.372, "r_y0": 471.539, "r_x1": 308.326, "r_y1": 471.539, "r_x2": 308.326, "r_y2": 468.803, "r_x3": 306.372, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 345.515, "t": 468.803, "r": 347.47, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.515, "r_y0": 471.539, "r_x1": 347.47, "r_y1": 471.539, "r_x2": 347.47, "r_y2": 468.803, "r_x3": 345.515, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 124, "label": "text", "bbox": {"l": 356.556, "t": 468.803, "r": 358.511, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.556, "r_y0": 471.539, "r_x1": 358.511, "r_y1": 471.539, "r_x2": 358.511, "r_y2": 468.803, "r_x3": 356.556, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 367.626, "t": 468.803, "r": 369.58, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 471.539, "r_x1": 369.58, "r_y1": 471.539, "r_x2": 369.58, "r_y2": 468.803, "r_x3": 367.626, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 382.661, "t": 468.803, "r": 384.615, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 471.539, "r_x1": 384.615, "r_y1": 471.539, "r_x2": 384.615, "r_y2": 468.803, "r_x3": 382.661, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 200.64, "t": 473.682, "r": 206.503, "b": 476.418, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 476.418, "r_x1": 206.503, "r_y1": 476.418, "r_x2": 206.503, "r_y2": 473.682, "r_x3": 200.64, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 128, "label": "text", "bbox": {"l": 264.29, "t": 473.682, "r": 266.245, "b": 476.418, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 476.418, "r_x1": 266.245, "r_y1": 476.418, "r_x2": 266.245, "r_y2": 473.682, "r_x3": 264.29, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 129, "label": "text", "bbox": {"l": 200.64, "t": 478.532, "r": 206.503, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 481.268, "r_x1": 206.503, "r_y1": 481.268, "r_x2": 206.503, "r_y2": 478.532, "r_x3": 200.64, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 130, "label": "text", "bbox": {"l": 243.264, "t": 478.532, "r": 245.218, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.264, "r_y0": 481.268, "r_x1": 245.218, "r_y1": 481.268, "r_x2": 245.218, "r_y2": 478.532, "r_x3": 243.264, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 131, "label": "text", "bbox": {"l": 264.29, "t": 478.532, "r": 266.245, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 481.268, "r_x1": 266.245, "r_y1": 481.268, "r_x2": 266.245, "r_y2": 478.532, "r_x3": 264.29, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 132, "label": "text", "bbox": {"l": 323.405, "t": 478.532, "r": 325.359, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.405, "r_y0": 481.268, "r_x1": 325.359, "r_y1": 481.268, "r_x2": 325.359, "r_y2": 478.532, "r_x3": 323.405, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 133, "label": "text", "bbox": {"l": 397.725, "t": 478.532, "r": 399.679, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 481.268, "r_x1": 399.679, "r_y1": 481.268, "r_x2": 399.679, "r_y2": 478.532, "r_x3": 397.725, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 134, "label": "text", "bbox": {"l": 200.64, "t": 483.411, "r": 206.503, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 486.147, "r_x1": 206.503, "r_y1": 486.147, "r_x2": 206.503, "r_y2": 483.411, "r_x3": 200.64, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 135, "label": "text", "bbox": {"l": 382.661, "t": 483.411, "r": 384.616, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 486.147, "r_x1": 384.616, "r_y1": 486.147, "r_x2": 384.616, "r_y2": 483.411, "r_x3": 382.661, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 136, "label": "text", "bbox": {"l": 397.725, "t": 483.411, "r": 401.648, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 486.147, "r_x1": 401.648, "r_y1": 486.147, "r_x2": 401.648, "r_y2": 483.411, "r_x3": 397.725, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 137, "label": "text", "bbox": {"l": 412.789, "t": 483.411, "r": 414.744, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 486.147, "r_x1": 414.744, "r_y1": 486.147, "r_x2": 414.744, "r_y2": 483.411, "r_x3": 412.789, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 138, "label": "text", "bbox": {"l": 200.64, "t": 488.29, "r": 207.134, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 491.026, "r_x1": 207.134, "r_y1": 491.026, "r_x2": 207.134, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 139, "label": "text", "bbox": {"l": 367.626, "t": 488.29, "r": 369.784, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 491.026, "r_x1": 369.784, "r_y1": 491.026, "r_x2": 369.784, "r_y2": 488.29, "r_x3": 367.626, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 140, "label": "text", "bbox": {"l": 382.661, "t": 488.29, "r": 384.819, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 491.026, "r_x1": 384.819, "r_y1": 491.026, "r_x2": 384.819, "r_y2": 488.29, "r_x3": 382.661, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 141, "label": "text", "bbox": {"l": 397.725, "t": 488.29, "r": 402.051, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 491.026, "r_x1": 402.051, "r_y1": 491.026, "r_x2": 402.051, "r_y2": 488.29, "r_x3": 397.725, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 142, "label": "text", "bbox": {"l": 200.64, "t": 493.168, "r": 208.472, "b": 495.904, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 495.904, "r_x1": 208.472, "r_y1": 495.904, "r_x2": 208.472, "r_y2": 493.168, "r_x3": 200.64, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 143, "label": "text", "bbox": {"l": 264.29, "t": 493.168, "r": 266.245, "b": 495.904, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 495.904, "r_x1": 266.245, "r_y1": 495.904, "r_x2": 266.245, "r_y2": 493.168, "r_x3": 264.29, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "text", "id": 144, "page_no": 9, "cluster": {"id": 144, "label": "text", "bbox": {"l": 227.915, "t": 665.826, "r": 230.1, "b": 675.346, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.915, "r_y0": 675.346, "r_x1": 230.1, "r_y1": 675.346, "r_x2": 230.1, "r_y2": 665.826, "r_x3": 227.915, "r_y3": 665.826, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u03bc"}, {"label": "text", "id": 145, "page_no": 9, "cluster": {"id": 145, "label": "text", "bbox": {"l": 300.581, "t": 683.622, "r": 302.726, "b": 693.429, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.581, "r_y0": 693.429, "r_x1": 302.726, "r_y1": 693.429, "r_x2": 302.726, "r_y2": 683.622, "r_x3": 300.581, "r_y3": 683.622, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2265"}], "body": [{"label": "caption", "id": 4, "page_no": 9, "cluster": {"id": 4, "label": "caption", "bbox": {"l": 134.765, "t": 113.62099999999998, "r": 480.594, "b": 146.82799999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9512290954589844, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 123.76199999999994, "r_x1": 173.094, "r_y1": 123.76199999999994, "r_x2": 173.094, "r_y2": 115.83600000000001, "r_x3": 134.765, "r_y3": 115.83600000000001, "coord_origin": "TOPLEFT"}, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.303, "r_y0": 124.90999999999997, "r_x1": 480.592, "r_y1": 124.90999999999997, "r_x2": 480.592, "r_y2": 113.62099999999998, "r_x3": 181.303, "r_y3": 113.62099999999998, "coord_origin": "TOPLEFT"}, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 135.86900000000003, "r_x1": 480.594, "r_y1": 135.86900000000003, "r_x2": 480.594, "r_y2": 124.58000000000004, "r_x3": 134.765, "r_y3": 124.58000000000004, "coord_origin": "TOPLEFT"}, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 146.82799999999997, "r_x1": 305.957, "r_y1": 146.82799999999997, "r_x2": 305.957, "r_y2": 135.539, "r_x3": 134.765, "r_y3": 135.539, "coord_origin": "TOPLEFT"}, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 2. TSR and cell detection results compared between OTSL and HTML on the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using TableFormer [9] (with enc=6, dec=6, heads=8)."}, {"label": "table", "id": 0, "page_no": 9, "cluster": {"id": 0, "label": "table", "bbox": {"l": 143.6376495361328, "t": 156.3477020263672, "r": 470.8485412597656, "b": 263.2624816894531, "coord_origin": "TOPLEFT"}, "confidence": 0.9884640574455261, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.782, "r_y0": 175.57000000000005, "r_x1": 194.998, "r_y1": 175.57000000000005, "r_x2": 194.998, "r_y2": 164.28099999999995, "r_x3": 160.782, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.525, "r_y0": 175.54499999999996, "r_x1": 254.045, "r_y1": 175.54499999999996, "r_x2": 254.045, "r_y2": 164.25599999999997, "r_x3": 215.525, "r_y3": 164.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.397, "r_y0": 170.09000000000003, "r_x1": 323.991, "r_y1": 170.09000000000003, "r_x2": 323.991, "r_y2": 158.80100000000004, "r_x3": 300.397, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.345, "r_y0": 175.57000000000005, "r_x1": 414.747, "r_y1": 175.57000000000005, "r_x2": 414.747, "r_y2": 164.28099999999995, "r_x3": 370.345, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.737, "r_y0": 170.09000000000003, "r_x1": 463.108, "r_y1": 170.09000000000003, "r_x2": 463.108, "r_y2": 158.80100000000004, "r_x3": 426.737, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.114, "r_y0": 181.04899999999998, "r_x1": 466.727, "r_y1": 181.04899999999998, "r_x2": 466.727, "r_y2": 169.76, "r_x3": 423.114, "r_y3": 169.76, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.413, "r_y0": 183.04200000000003, "r_x1": 288.06, "r_y1": 183.04200000000003, "r_x2": 288.06, "r_y2": 171.75300000000004, "r_x3": 262.413, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.429, "r_y0": 183.04200000000003, "r_x1": 329.447, "r_y1": 183.04200000000003, "r_x2": 329.447, "r_y2": 171.75300000000004, "r_x3": 296.429, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.033, "r_y0": 183.04200000000003, "r_x1": 354.758, "r_y1": 183.04200000000003, "r_x2": 354.758, "r_y2": 171.75300000000004, "r_x3": 345.033, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.538, "r_y0": 201.87099999999998, "r_x1": 201.241, "r_y1": 201.87099999999998, "r_x2": 201.241, "r_y2": 190.582, "r_x3": 154.538, "r_y3": 190.582, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 196.39200000000005, "r_x1": 247.132, "r_y1": 196.39200000000005, "r_x2": 247.132, "r_y2": 185.10299999999995, "r_x3": 222.437, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 196.39200000000005, "r_x1": 285.731, "r_y1": 196.39200000000005, "r_x2": 285.731, "r_y2": 185.10299999999995, "r_x3": 264.744, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 196.39200000000005, "r_x1": 323.431, "r_y1": 196.39200000000005, "r_x2": 323.431, "r_y2": 185.10299999999995, "r_x3": 302.444, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 196.39200000000005, "r_x1": 360.39, "r_y1": 196.39200000000005, "r_x2": 360.39, "r_y2": 185.10299999999995, "r_x3": 339.403, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.116, "r_y0": 195.24400000000003, "r_x1": 401.973, "r_y1": 195.24400000000003, "r_x2": 401.973, "r_y2": 187.31799999999998, "r_x3": 383.116, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 195.24400000000003, "r_x1": 454.35, "r_y1": 195.24400000000003, "r_x2": 454.35, "r_y2": 187.31799999999998, "r_x3": 435.493, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 209.34299999999996, "r_x1": 248.667, "r_y1": 209.34299999999996, "r_x2": 248.667, "r_y2": 198.05399999999997, "r_x3": 220.903, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 209.34299999999996, "r_x1": 285.731, "r_y1": 209.34299999999996, "r_x2": 285.731, "r_y2": 198.05399999999997, "r_x3": 264.744, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 209.34299999999996, "r_x1": 323.431, "r_y1": 209.34299999999996, "r_x2": 323.431, "r_y2": 198.05399999999997, "r_x3": 302.444, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 209.34299999999996, "r_x1": 360.39, "r_y1": 209.34299999999996, "r_x2": 360.39, "r_y2": 198.05399999999997, "r_x3": 339.403, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 209.34299999999996, "r_x1": 403.039, "r_y1": 209.34299999999996, "r_x2": 403.039, "r_y2": 198.05399999999997, "r_x3": 382.052, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 209.34299999999996, "r_x1": 453.112, "r_y1": 209.34299999999996, "r_x2": 453.112, "r_y2": 198.05399999999997, "r_x3": 436.732, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.945, "r_y0": 228.173, "r_x1": 199.834, "r_y1": 228.173, "r_x2": 199.834, "r_y2": 216.88400000000001, "r_x3": 155.945, "r_y3": 216.88400000000001, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 222.69299999999998, "r_x1": 247.132, "r_y1": 222.69299999999998, "r_x2": 247.132, "r_y2": 211.404, "r_x3": 222.437, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 222.69299999999998, "r_x1": 285.731, "r_y1": 222.69299999999998, "r_x2": 285.731, "r_y2": 211.404, "r_x3": 264.744, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 222.69299999999998, "r_x1": 323.431, "r_y1": 222.69299999999998, "r_x2": 323.431, "r_y2": 211.404, "r_x3": 302.444, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 221.54499999999996, "r_x1": 361.976, "r_y1": 221.54499999999996, "r_x2": 361.976, "r_y2": 213.61900000000003, "r_x3": 337.815, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 221.54499999999996, "r_x1": 404.625, "r_y1": 221.54499999999996, "r_x2": 404.625, "r_y2": 213.61900000000003, "r_x3": 380.464, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 221.54499999999996, "r_x1": 454.35, "r_y1": 221.54499999999996, "r_x2": 454.35, "r_y2": 213.61900000000003, "r_x3": 435.493, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 235.64499999999998, "r_x1": 248.667, "r_y1": 235.64499999999998, "r_x2": 248.667, "r_y2": 224.356, "r_x3": 220.903, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 235.64499999999998, "r_x1": 285.731, "r_y1": 235.64499999999998, "r_x2": 285.731, "r_y2": 224.356, "r_x3": 264.744, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 235.64499999999998, "r_x1": 323.431, "r_y1": 235.64499999999998, "r_x2": 323.431, "r_y2": 224.356, "r_x3": 302.444, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.706, "r_y0": 235.64499999999998, "r_x1": 358.086, "r_y1": 235.64499999999998, "r_x2": 358.086, "r_y2": 224.356, "r_x3": 341.706, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 235.64499999999998, "r_x1": 403.039, "r_y1": 235.64499999999998, "r_x2": 403.039, "r_y2": 224.356, "r_x3": 382.052, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 235.64499999999998, "r_x1": 453.112, "r_y1": 235.64499999999998, "r_x2": 453.112, "r_y2": 224.356, "r_x3": 436.732, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.626, "r_y0": 254.47400000000005, "r_x1": 207.152, "r_y1": 254.47400000000005, "r_x2": 207.152, "r_y2": 243.18499999999995, "r_x3": 148.626, "r_y3": 243.18499999999995, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 248.99400000000003, "r_x1": 247.132, "r_y1": 248.99400000000003, "r_x2": 247.132, "r_y2": 237.70500000000004, "r_x3": 222.437, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 248.99400000000003, "r_x1": 285.731, "r_y1": 248.99400000000003, "r_x2": 285.731, "r_y2": 237.70500000000004, "r_x3": 264.744, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 248.99400000000003, "r_x1": 323.431, "r_y1": 248.99400000000003, "r_x2": 323.431, "r_y2": 237.70500000000004, "r_x3": 302.444, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 247.846, "r_x1": 361.976, "r_y1": 247.846, "r_x2": 361.976, "r_y2": 239.91999999999996, "r_x3": 337.815, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 247.846, "r_x1": 404.625, "r_y1": 247.846, "r_x2": 404.625, "r_y2": 239.91999999999996, "r_x3": 380.464, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 247.846, "r_x1": 454.35, "r_y1": 247.846, "r_x2": 454.35, "r_y2": 239.91999999999996, "r_x3": 435.493, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 261.946, "r_x1": 248.667, "r_y1": 261.946, "r_x2": 248.667, "r_y2": 250.65700000000004, "r_x3": 220.903, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 261.946, "r_x1": 285.731, "r_y1": 261.946, "r_x2": 285.731, "r_y2": 250.65700000000004, "r_x3": 264.744, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 261.946, "r_x1": 323.431, "r_y1": 261.946, "r_x2": 323.431, "r_y2": 250.65700000000004, "r_x3": 302.444, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 261.946, "r_x1": 360.39, "r_y1": 261.946, "r_x2": 360.39, "r_y2": 250.65700000000004, "r_x3": 339.403, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 261.946, "r_x1": 403.039, "r_y1": 261.946, "r_x2": 403.039, "r_y2": 250.65700000000004, "r_x3": 382.052, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 261.946, "r_x1": 453.112, "r_y1": 261.946, "r_x2": 453.112, "r_y2": 250.65700000000004, "r_x3": 436.732, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 10, "label": "text", "bbox": {"l": 160.782, "t": 164.28099999999995, "r": 194.998, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.782, "r_y0": 175.57000000000005, "r_x1": 194.998, "r_y1": 175.57000000000005, "r_x2": 194.998, "r_y2": 164.28099999999995, "r_x3": 160.782, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 215.525, "t": 164.25599999999997, "r": 254.045, "b": 175.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.525, "r_y0": 175.54499999999996, "r_x1": 254.045, "r_y1": 175.54499999999996, "r_x2": 254.045, "r_y2": 164.25599999999997, "r_x3": 215.525, "r_y3": 164.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 300.397, "t": 158.80100000000004, "r": 323.991, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.397, "r_y0": 170.09000000000003, "r_x1": 323.991, "r_y1": 170.09000000000003, "r_x2": 323.991, "r_y2": 158.80100000000004, "r_x3": 300.397, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 370.345, "t": 164.28099999999995, "r": 414.747, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.345, "r_y0": 175.57000000000005, "r_x1": 414.747, "r_y1": 175.57000000000005, "r_x2": 414.747, "r_y2": 164.28099999999995, "r_x3": 370.345, "r_y3": 164.28099999999995, "coord_origin": "TOPLEFT"}, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 426.737, "t": 158.80100000000004, "r": 463.108, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.737, "r_y0": 170.09000000000003, "r_x1": 463.108, "r_y1": 170.09000000000003, "r_x2": 463.108, "r_y2": 158.80100000000004, "r_x3": 426.737, "r_y3": 158.80100000000004, "coord_origin": "TOPLEFT"}, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 423.114, "t": 169.76, "r": 466.727, "b": 181.04899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.114, "r_y0": 181.04899999999998, "r_x1": 466.727, "r_y1": 181.04899999999998, "r_x2": 466.727, "r_y2": 169.76, "r_x3": 423.114, "r_y3": 169.76, "coord_origin": "TOPLEFT"}, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 262.413, "t": 171.75300000000004, "r": 288.06, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.413, "r_y0": 183.04200000000003, "r_x1": 288.06, "r_y1": 183.04200000000003, "r_x2": 288.06, "r_y2": 171.75300000000004, "r_x3": 262.413, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 296.429, "t": 171.75300000000004, "r": 329.447, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.429, "r_y0": 183.04200000000003, "r_x1": 329.447, "r_y1": 183.04200000000003, "r_x2": 329.447, "r_y2": 171.75300000000004, "r_x3": 296.429, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 345.033, "t": 171.75300000000004, "r": 354.758, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.033, "r_y0": 183.04200000000003, "r_x1": 354.758, "r_y1": 183.04200000000003, "r_x2": 354.758, "r_y2": 171.75300000000004, "r_x3": 345.033, "r_y3": 171.75300000000004, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 154.538, "t": 190.582, "r": 201.241, "b": 201.87099999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.538, "r_y0": 201.87099999999998, "r_x1": 201.241, "r_y1": 201.87099999999998, "r_x2": 201.241, "r_y2": 190.582, "r_x3": 154.538, "r_y3": 190.582, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 222.437, "t": 185.10299999999995, "r": 247.132, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 196.39200000000005, "r_x1": 247.132, "r_y1": 196.39200000000005, "r_x2": 247.132, "r_y2": 185.10299999999995, "r_x3": 222.437, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 264.744, "t": 185.10299999999995, "r": 285.731, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 196.39200000000005, "r_x1": 285.731, "r_y1": 196.39200000000005, "r_x2": 285.731, "r_y2": 185.10299999999995, "r_x3": 264.744, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 302.444, "t": 185.10299999999995, "r": 323.431, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 196.39200000000005, "r_x1": 323.431, "r_y1": 196.39200000000005, "r_x2": 323.431, "r_y2": 185.10299999999995, "r_x3": 302.444, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 339.403, "t": 185.10299999999995, "r": 360.39, "b": 196.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 196.39200000000005, "r_x1": 360.39, "r_y1": 196.39200000000005, "r_x2": 360.39, "r_y2": 185.10299999999995, "r_x3": 339.403, "r_y3": 185.10299999999995, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 383.116, "t": 187.31799999999998, "r": 401.973, "b": 195.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.116, "r_y0": 195.24400000000003, "r_x1": 401.973, "r_y1": 195.24400000000003, "r_x2": 401.973, "r_y2": 187.31799999999998, "r_x3": 383.116, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 435.493, "t": 187.31799999999998, "r": 454.35, "b": 195.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 195.24400000000003, "r_x1": 454.35, "r_y1": 195.24400000000003, "r_x2": 454.35, "r_y2": 187.31799999999998, "r_x3": 435.493, "r_y3": 187.31799999999998, "coord_origin": "TOPLEFT"}, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 220.903, "t": 198.05399999999997, "r": 248.667, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 209.34299999999996, "r_x1": 248.667, "r_y1": 209.34299999999996, "r_x2": 248.667, "r_y2": 198.05399999999997, "r_x3": 220.903, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 264.744, "t": 198.05399999999997, "r": 285.731, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 209.34299999999996, "r_x1": 285.731, "r_y1": 209.34299999999996, "r_x2": 285.731, "r_y2": 198.05399999999997, "r_x3": 264.744, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 302.444, "t": 198.05399999999997, "r": 323.431, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 209.34299999999996, "r_x1": 323.431, "r_y1": 209.34299999999996, "r_x2": 323.431, "r_y2": 198.05399999999997, "r_x3": 302.444, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 339.403, "t": 198.05399999999997, "r": 360.39, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 209.34299999999996, "r_x1": 360.39, "r_y1": 209.34299999999996, "r_x2": 360.39, "r_y2": 198.05399999999997, "r_x3": 339.403, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 382.052, "t": 198.05399999999997, "r": 403.039, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 209.34299999999996, "r_x1": 403.039, "r_y1": 209.34299999999996, "r_x2": 403.039, "r_y2": 198.05399999999997, "r_x3": 382.052, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 436.732, "t": 198.05399999999997, "r": 453.112, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 209.34299999999996, "r_x1": 453.112, "r_y1": 209.34299999999996, "r_x2": 453.112, "r_y2": 198.05399999999997, "r_x3": 436.732, "r_y3": 198.05399999999997, "coord_origin": "TOPLEFT"}, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 155.945, "t": 216.88400000000001, "r": 199.834, "b": 228.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.945, "r_y0": 228.173, "r_x1": 199.834, "r_y1": 228.173, "r_x2": 199.834, "r_y2": 216.88400000000001, "r_x3": 155.945, "r_y3": 216.88400000000001, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 222.437, "t": 211.404, "r": 247.132, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 222.69299999999998, "r_x1": 247.132, "r_y1": 222.69299999999998, "r_x2": 247.132, "r_y2": 211.404, "r_x3": 222.437, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 264.744, "t": 211.404, "r": 285.731, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 222.69299999999998, "r_x1": 285.731, "r_y1": 222.69299999999998, "r_x2": 285.731, "r_y2": 211.404, "r_x3": 264.744, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 302.444, "t": 211.404, "r": 323.431, "b": 222.69299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 222.69299999999998, "r_x1": 323.431, "r_y1": 222.69299999999998, "r_x2": 323.431, "r_y2": 211.404, "r_x3": 302.444, "r_y3": 211.404, "coord_origin": "TOPLEFT"}, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 337.815, "t": 213.61900000000003, "r": 361.976, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 221.54499999999996, "r_x1": 361.976, "r_y1": 221.54499999999996, "r_x2": 361.976, "r_y2": 213.61900000000003, "r_x3": 337.815, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 380.464, "t": 213.61900000000003, "r": 404.625, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 221.54499999999996, "r_x1": 404.625, "r_y1": 221.54499999999996, "r_x2": 404.625, "r_y2": 213.61900000000003, "r_x3": 380.464, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 435.493, "t": 213.61900000000003, "r": 454.35, "b": 221.54499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 221.54499999999996, "r_x1": 454.35, "r_y1": 221.54499999999996, "r_x2": 454.35, "r_y2": 213.61900000000003, "r_x3": 435.493, "r_y3": 213.61900000000003, "coord_origin": "TOPLEFT"}, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 220.903, "t": 224.356, "r": 248.667, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 235.64499999999998, "r_x1": 248.667, "r_y1": 235.64499999999998, "r_x2": 248.667, "r_y2": 224.356, "r_x3": 220.903, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 264.744, "t": 224.356, "r": 285.731, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 235.64499999999998, "r_x1": 285.731, "r_y1": 235.64499999999998, "r_x2": 285.731, "r_y2": 224.356, "r_x3": 264.744, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 302.444, "t": 224.356, "r": 323.431, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 235.64499999999998, "r_x1": 323.431, "r_y1": 235.64499999999998, "r_x2": 323.431, "r_y2": 224.356, "r_x3": 302.444, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 341.706, "t": 224.356, "r": 358.086, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.706, "r_y0": 235.64499999999998, "r_x1": 358.086, "r_y1": 235.64499999999998, "r_x2": 358.086, "r_y2": 224.356, "r_x3": 341.706, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 382.052, "t": 224.356, "r": 403.039, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 235.64499999999998, "r_x1": 403.039, "r_y1": 235.64499999999998, "r_x2": 403.039, "r_y2": 224.356, "r_x3": 382.052, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 436.732, "t": 224.356, "r": 453.112, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 235.64499999999998, "r_x1": 453.112, "r_y1": 235.64499999999998, "r_x2": 453.112, "r_y2": 224.356, "r_x3": 436.732, "r_y3": 224.356, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 148.626, "t": 243.18499999999995, "r": 207.152, "b": 254.47400000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.626, "r_y0": 254.47400000000005, "r_x1": 207.152, "r_y1": 254.47400000000005, "r_x2": 207.152, "r_y2": 243.18499999999995, "r_x3": 148.626, "r_y3": 243.18499999999995, "coord_origin": "TOPLEFT"}, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 222.437, "t": 237.70500000000004, "r": 247.132, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.437, "r_y0": 248.99400000000003, "r_x1": 247.132, "r_y1": 248.99400000000003, "r_x2": 247.132, "r_y2": 237.70500000000004, "r_x3": 222.437, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 264.744, "t": 237.70500000000004, "r": 285.731, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 248.99400000000003, "r_x1": 285.731, "r_y1": 248.99400000000003, "r_x2": 285.731, "r_y2": 237.70500000000004, "r_x3": 264.744, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 302.444, "t": 237.70500000000004, "r": 323.431, "b": 248.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 248.99400000000003, "r_x1": 323.431, "r_y1": 248.99400000000003, "r_x2": 323.431, "r_y2": 237.70500000000004, "r_x3": 302.444, "r_y3": 237.70500000000004, "coord_origin": "TOPLEFT"}, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 337.815, "t": 239.91999999999996, "r": 361.976, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.815, "r_y0": 247.846, "r_x1": 361.976, "r_y1": 247.846, "r_x2": 361.976, "r_y2": 239.91999999999996, "r_x3": 337.815, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 380.464, "t": 239.91999999999996, "r": 404.625, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.464, "r_y0": 247.846, "r_x1": 404.625, "r_y1": 247.846, "r_x2": 404.625, "r_y2": 239.91999999999996, "r_x3": 380.464, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 435.493, "t": 239.91999999999996, "r": 454.35, "b": 247.846, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.493, "r_y0": 247.846, "r_x1": 454.35, "r_y1": 247.846, "r_x2": 454.35, "r_y2": 239.91999999999996, "r_x3": 435.493, "r_y3": 239.91999999999996, "coord_origin": "TOPLEFT"}, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 220.903, "t": 250.65700000000004, "r": 248.667, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.903, "r_y0": 261.946, "r_x1": 248.667, "r_y1": 261.946, "r_x2": 248.667, "r_y2": 250.65700000000004, "r_x3": 220.903, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 264.744, "t": 250.65700000000004, "r": 285.731, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.744, "r_y0": 261.946, "r_x1": 285.731, "r_y1": 261.946, "r_x2": 285.731, "r_y2": 250.65700000000004, "r_x3": 264.744, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 302.444, "t": 250.65700000000004, "r": 323.431, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 302.444, "r_y0": 261.946, "r_x1": 323.431, "r_y1": 261.946, "r_x2": 323.431, "r_y2": 250.65700000000004, "r_x3": 302.444, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 339.403, "t": 250.65700000000004, "r": 360.39, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.403, "r_y0": 261.946, "r_x1": 360.39, "r_y1": 261.946, "r_x2": 360.39, "r_y2": 250.65700000000004, "r_x3": 339.403, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 382.052, "t": 250.65700000000004, "r": 403.039, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.052, "r_y0": 261.946, "r_x1": 403.039, "r_y1": 261.946, "r_x2": 403.039, "r_y2": 250.65700000000004, "r_x3": 382.052, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 436.732, "t": 250.65700000000004, "r": 453.112, "b": 261.946, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 261.946, "r_x1": 453.112, "r_y1": 261.946, "r_x2": 453.112, "r_y2": 250.65700000000004, "r_x3": 436.732, "r_y3": 250.65700000000004, "coord_origin": "TOPLEFT"}, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 5, "num_cols": 7, "table_cells": [{"bbox": {"l": 160.782, "t": 164.28099999999995, "r": 194.998, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 215.525, "t": 164.25599999999997, "r": 254.045, "b": 175.54499999999996, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 300.397, "t": 158.80100000000004, "r": 323.991, "b": 170.09000000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 370.345, "t": 164.28099999999995, "r": 414.747, "b": 175.57000000000005, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 423.114, "t": 158.80100000000004, "r": 466.727, "b": 181.04899999999998, "coord_origin": "TOPLEFT"}, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 262.413, "t": 171.75300000000004, "r": 288.06, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 296.429, "t": 171.75300000000004, "r": 329.447, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 345.033, "t": 171.75300000000004, "r": 354.758, "b": 183.04200000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 154.538, "t": 190.582, "r": 201.241, "b": 201.87099999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.903, "t": 185.10299999999995, "r": 248.667, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 264.744, "t": 185.10299999999995, "r": 285.731, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 302.444, "t": 185.10299999999995, "r": 323.431, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 339.403, "t": 185.10299999999995, "r": 360.39, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 382.052, "t": 187.31799999999998, "r": 403.039, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 435.493, "t": 187.31799999999998, "r": 454.35, "b": 209.34299999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 155.945, "t": 216.88400000000001, "r": 199.834, "b": 228.173, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.903, "t": 211.404, "r": 248.667, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 264.744, "t": 211.404, "r": 285.731, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 302.444, "t": 211.404, "r": 323.431, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 337.815, "t": 213.61900000000003, "r": 361.976, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 380.464, "t": 213.61900000000003, "r": 404.625, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 435.493, "t": 213.61900000000003, "r": 454.35, "b": 235.64499999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 148.626, "t": 243.18499999999995, "r": 207.152, "b": 254.47400000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.903, "t": 237.70500000000004, "r": 248.667, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 264.744, "t": 237.70500000000004, "r": 285.731, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 302.444, "t": 237.70500000000004, "r": 323.431, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 337.815, "t": 239.91999999999996, "r": 361.976, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 380.464, "t": 239.91999999999996, "r": 404.625, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 435.493, "t": 239.91999999999996, "r": 454.35, "b": 261.946, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "section_header", "id": 3, "page_no": 9, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 134.765, "t": 288.915, "r": 257.087, "b": 297.722, "coord_origin": "TOPLEFT"}, "confidence": 0.9546447992324829, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 297.722, "r_x1": 149.402, "r_y1": 297.722, "r_x2": 149.402, "r_y2": 288.915, "r_x3": 134.765, "r_y3": 288.915, "coord_origin": "TOPLEFT"}, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.859, "r_y0": 297.722, "r_x1": 257.087, "r_y1": 297.722, "r_x2": 257.087, "r_y2": 288.915, "r_x3": 160.859, "r_y3": 288.915, "coord_origin": "TOPLEFT"}, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.3 Qualitative Results"}, {"label": "text", "id": 1, "page_no": 9, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 309.861, "r": 480.59, "b": 366.478, "coord_origin": "TOPLEFT"}, "confidence": 0.9834085702896118, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 318.658, "r_x1": 189.59, "r_y1": 318.658, "r_x2": 189.59, "r_y2": 309.861, "r_x3": 134.765, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "To illustrate", "orig": "To illustrate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.263, "r_y0": 318.658, "r_x1": 208.096, "r_y1": 318.658, "r_x2": 208.096, "r_y2": 309.861, "r_x3": 194.263, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.768, "r_y0": 318.658, "r_x1": 258.971, "r_y1": 318.658, "r_x2": 258.971, "r_y2": 309.861, "r_x3": 212.768, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "qualitative", "orig": "qualitative", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.643, "r_y0": 318.658, "r_x1": 308.822, "r_y1": 318.658, "r_x2": 308.822, "r_y2": 309.861, "r_x3": 263.643, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "differences", "orig": "differences", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.484, "r_y0": 318.658, "r_x1": 480.588, "r_y1": 318.658, "r_x2": 480.588, "r_y2": 309.861, "r_x3": 313.484, "r_y3": 309.861, "coord_origin": "TOPLEFT"}, "text": "between OTSL and HTML, Figure 5", "orig": "between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 330.613, "r_x1": 480.589, "r_y1": 330.613, "r_x2": 480.589, "r_y2": 321.816, "r_x3": 134.765, "r_y3": 321.816, "coord_origin": "TOPLEFT"}, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 342.568, "r_x1": 480.587, "r_y1": 342.568, "r_x2": 480.587, "r_y2": 333.771, "r_x3": 134.765, "r_y3": 333.771, "coord_origin": "TOPLEFT"}, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 354.523, "r_x1": 480.59, "r_y1": 354.523, "r_x2": 480.59, "r_y2": 345.726, "r_x3": 134.765, "r_y3": 345.726, "coord_origin": "TOPLEFT"}, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 366.478, "r_x1": 161.657, "r_y1": 366.478, "r_x2": 161.657, "r_y2": 357.681, "r_x3": 134.765, "r_y3": 357.681, "coord_origin": "TOPLEFT"}, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5 demonstrates less overlap and more accurate bounding boxes with OTSL. In Figure 6, OTSL proves to be more effective in handling tables with longer token sequences, resulting in even more precise structure prediction and bounding boxes."}, {"label": "caption", "id": 5, "page_no": 9, "cluster": {"id": 5, "label": "caption", "bbox": {"l": 134.765, "t": 395.375, "r": 480.591, "b": 439.717, "coord_origin": "TOPLEFT"}, "confidence": 0.9482728838920593, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 405.516, "r_x1": 162.644, "r_y1": 405.516, "r_x2": 162.644, "r_y2": 397.59, "r_x3": 134.765, "r_y3": 397.59, "coord_origin": "TOPLEFT"}, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.384, "r_y0": 406.664, "r_x1": 437.456, "r_y1": 406.664, "r_x2": 437.456, "r_y2": 395.375, "r_x3": 167.384, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "The OTSL model produces more accurate bounding boxes with", "orig": "The OTSL model produces more accurate bounding boxes with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.2, "r_y0": 406.664, "r_x1": 456.125, "r_y1": 406.664, "r_x2": 456.125, "r_y2": 395.375, "r_x3": 442.2, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "less", "orig": "less", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.86, "r_y0": 406.664, "r_x1": 480.591, "r_y1": 406.664, "r_x2": 480.591, "r_y2": 395.375, "r_x3": 460.86, "r_y3": 395.375, "coord_origin": "TOPLEFT"}, "text": "over-", "orig": "over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 417.623, "r_x1": 147.049, "r_y1": 417.623, "r_x2": 147.049, "r_y2": 406.334, "r_x3": 134.765, "r_y3": 406.334, "coord_origin": "TOPLEFT"}, "text": "lap", "orig": "lap", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.434, "r_y0": 417.623, "r_x1": 480.591, "r_y1": 417.623, "r_x2": 480.591, "r_y2": 406.334, "r_x3": 151.434, "r_y3": 406.334, "coord_origin": "TOPLEFT"}, "text": "(E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "(E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 428.582, "r_x1": 146.541, "r_y1": 428.582, "r_x2": 146.541, "r_y2": 417.293, "r_x3": 134.765, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "ble", "orig": "ble", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.391, "r_y0": 428.582, "r_x1": 168.025, "r_y1": 428.582, "r_x2": 168.025, "r_y2": 417.293, "r_x3": 151.391, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "(A),", "orig": "(A),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.885, "r_y0": 428.582, "r_x1": 181.066, "r_y1": 428.582, "r_x2": 181.066, "r_y2": 417.293, "r_x3": 172.885, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "at", "orig": "at", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.925, "r_y0": 428.582, "r_x1": 206.655, "r_y1": 428.582, "r_x2": 206.655, "r_y2": 417.293, "r_x3": 185.925, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "twice", "orig": "twice", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.506, "r_y0": 428.582, "r_x1": 224.305, "r_y1": 428.582, "r_x2": 224.305, "r_y2": 417.293, "r_x3": 211.506, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.165, "r_y0": 428.582, "r_x1": 264.77, "r_y1": 428.582, "r_x2": 264.77, "r_y2": 417.293, "r_x3": 229.165, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "inference", "orig": "inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.621, "r_y0": 428.582, "r_x1": 291.939, "r_y1": 428.582, "r_x2": 291.939, "r_y2": 417.293, "r_x3": 269.621, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "speed", "orig": "speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 296.799, "r_y0": 428.582, "r_x1": 327.819, "r_y1": 428.582, "r_x2": 327.819, "r_y2": 417.293, "r_x3": 296.799, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "because", "orig": "because", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.67, "r_y0": 428.582, "r_x1": 340.092, "r_y1": 428.582, "r_x2": 340.092, "r_y2": 417.293, "r_x3": 332.67, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.952, "r_y0": 428.582, "r_x1": 373.2, "r_y1": 428.582, "r_x2": 373.2, "r_y2": 417.293, "r_x3": 344.952, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "shorter", "orig": "shorter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.05, "r_y0": 428.582, "r_x1": 413.174, "r_y1": 428.582, "r_x2": 413.174, "r_y2": 417.293, "r_x3": 378.05, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "sequence", "orig": "sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.024, "r_y0": 428.582, "r_x1": 443.108, "r_y1": 428.582, "r_x2": 443.108, "r_y2": 417.293, "r_x3": 418.024, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "length", "orig": "length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.959, "r_y0": 428.582, "r_x1": 480.588, "r_y1": 428.582, "r_x2": 480.588, "r_y2": 417.293, "r_x3": 447.959, "r_y3": 417.293, "coord_origin": "TOPLEFT"}, "text": "(B),(C).", "orig": "(B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 439.541, "r_x1": 304.692, "r_y1": 439.541, "r_x2": 304.692, "r_y2": 428.252, "r_x3": 134.765, "r_y3": 428.252, "coord_origin": "TOPLEFT"}, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 342.634, "r_y0": 439.717, "r_x1": 344.819, "r_y1": 439.717, "r_x2": 344.819, "r_y2": 430.197, "r_x3": 342.634, "r_y3": 430.197, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 5. The OTSL model produces more accurate bounding boxes with less overlap (E) than the HTML model (D), when predicting the structure of a sparse table (A), at twice the inference speed because of shorter sequence length (B),(C). \"PMC2807444_006_00.png\" PubTabNet. \u03bc"}, {"label": "picture", "id": 2, "page_no": 9, "cluster": {"id": 2, "label": "picture", "bbox": {"l": 162.67430114746094, "t": 444.62255859375, "r": 451.70062255859375, "b": 663.2135620117188, "coord_origin": "TOPLEFT"}, "confidence": 0.9742383360862732, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 518.934, "r_x1": 190.62, "r_y1": 518.934, "r_x2": 190.62, "r_y2": 516.296, "r_x3": 180.125, "r_y3": 516.296, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 522.8330000000001, "r_x1": 304.548, "r_y1": 522.8330000000001, "r_x2": 304.548, "r_y2": 520.194, "r_x3": 183.244, "r_y3": 520.194, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "orig": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 526.731, "r_x1": 388.423, "r_y1": 526.731, "r_x2": 388.423, "r_y2": 524.0930000000001, "r_x3": 183.244, "r_y3": 524.0930000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 530.63, "r_x1": 388.423, "r_y1": 530.63, "r_x2": 388.423, "r_y2": 527.992, "r_x3": 183.244, "r_y3": 527.992, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 534.529, "r_x1": 388.423, "r_y1": 534.529, "r_x2": 388.423, "r_y2": 531.8910000000001, "r_x3": 183.244, "r_y3": 531.8910000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 538.428, "r_x1": 388.423, "r_y1": 538.428, "r_x2": 388.423, "r_y2": 535.79, "r_x3": 183.244, "r_y3": 535.79, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 542.327, "r_x1": 388.423, "r_y1": 542.327, "r_x2": 388.423, "r_y2": 539.689, "r_x3": 183.244, "r_y3": 539.689, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 546.226, "r_x1": 388.423, "r_y1": 546.226, "r_x2": 388.423, "r_y2": 543.588, "r_x3": 183.244, "r_y3": 543.588, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 550.124, "r_x1": 388.423, "r_y1": 550.124, "r_x2": 388.423, "r_y2": 547.486, "r_x3": 183.244, "r_y3": 547.486, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 554.023, "r_x1": 388.423, "r_y1": 554.023, "r_x2": 388.423, "r_y2": 551.385, "r_x3": 183.244, "r_y3": 551.385, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 557.922, "r_x1": 191.868, "r_y1": 557.922, "r_x2": 191.868, "r_y2": 555.284, "r_x3": 180.125, "r_y3": 555.284, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 521.001, "r_x1": 450.486, "r_y1": 521.001, "r_x2": 450.486, "r_y2": 518.363, "r_x3": 407.383, "r_y3": 518.363, "coord_origin": "TOPLEFT"}, "text": "C C L L L C L L L L L C L L NL", "orig": "C C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 524.9, "r_x1": 450.486, "r_y1": 524.9, "r_x2": 450.486, "r_y2": 522.262, "r_x3": 407.383, "r_y3": 522.262, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 528.799, "r_x1": 450.486, "r_y1": 528.799, "r_x2": 450.486, "r_y2": 526.1600000000001, "r_x3": 407.383, "r_y3": 526.1600000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 532.697, "r_x1": 450.486, "r_y1": 532.697, "r_x2": 450.486, "r_y2": 530.059, "r_x3": 407.383, "r_y3": 530.059, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 536.596, "r_x1": 450.486, "r_y1": 536.596, "r_x2": 450.486, "r_y2": 533.9580000000001, "r_x3": 407.383, "r_y3": 533.9580000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 540.495, "r_x1": 450.486, "r_y1": 540.495, "r_x2": 450.486, "r_y2": 537.857, "r_x3": 407.383, "r_y3": 537.857, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 544.394, "r_x1": 450.486, "r_y1": 544.394, "r_x2": 450.486, "r_y2": 541.756, "r_x3": 407.383, "r_y3": 541.756, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 548.293, "r_x1": 450.486, "r_y1": 548.293, "r_x2": 450.486, "r_y2": 545.655, "r_x3": 407.383, "r_y3": 545.655, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 552.192, "r_x1": 450.486, "r_y1": 552.192, "r_x2": 450.486, "r_y2": 549.554, "r_x3": 407.383, "r_y3": 549.554, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.529, "r_y0": 515.288, "r_x1": 181.853, "r_y1": 515.288, "r_x2": 181.853, "r_y2": 509.533, "r_x3": 164.529, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.584, "r_y0": 515.288, "r_x1": 208.901, "r_y1": 515.288, "r_x2": 208.901, "r_y2": 509.533, "r_x3": 183.584, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 515.288, "r_x1": 221.04, "r_y1": 515.288, "r_x2": 221.04, "r_y2": 509.533, "r_x3": 210.633, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.202, "r_y0": 515.433, "r_x1": 406.836, "r_y1": 515.433, "r_x2": 406.836, "r_y2": 509.678, "r_x3": 390.202, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.569, "r_y0": 515.433, "r_x1": 433.886, "r_y1": 515.433, "r_x2": 433.886, "r_y2": 509.678, "r_x3": 408.569, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.617, "r_y0": 515.433, "r_x1": 446.025, "r_y1": 515.433, "r_x2": 446.025, "r_y2": 509.678, "r_x3": 435.617, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.193, "r_y0": 526.36, "r_x1": 172.823, "r_y1": 526.36, "r_x2": 172.823, "r_y2": 519.1659999999999, "r_x3": 167.193, "r_y3": 519.1659999999999, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.337, "r_y0": 455.912, "r_x1": 192.967, "r_y1": 455.912, "r_x2": 192.967, "r_y2": 448.718, "r_x3": 187.337, "r_y3": 448.718, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.387, "r_y0": 573.292, "r_x1": 173.016, "r_y1": 573.292, "r_x2": 173.016, "r_y2": 566.0989999999999, "r_x3": 167.387, "r_y3": 566.0989999999999, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.456, "r_y0": 629.067, "r_x1": 253.657, "r_y1": 629.067, "r_x2": 253.657, "r_y2": 621.874, "r_x3": 248.456, "r_y3": 621.874, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.901, "r_y0": 526.4870000000001, "r_x1": 401.531, "r_y1": 526.4870000000001, "r_x2": 401.531, "r_y2": 519.293, "r_x3": 395.901, "r_y3": 519.293, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.46, "r_y0": 597.268, "r_x1": 177.455, "r_y1": 580.287, "r_x2": 171.7, "r_y2": 580.289, "r_x3": 171.705, "r_y3": 597.269, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.891, "r_y0": 649.923, "r_x1": 256.886, "r_y1": 633.633, "r_x2": 251.131, "r_y2": 633.634, "r_x3": 251.136, "r_y3": 649.925, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 607.287, "r_x1": 427.038, "r_y1": 607.287, "r_x2": 427.038, "r_y2": 601.532, "r_x3": 372.146, "r_y3": 601.532, "coord_origin": "TOPLEFT"}, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 613.729, "r_x1": 430.068, "r_y1": 613.729, "r_x2": 430.068, "r_y2": 607.9739999999999, "r_x3": 372.146, "r_y3": 607.9739999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 648.702, "r_x1": 231.082, "r_y1": 648.702, "r_x2": 231.082, "r_y2": 642.947, "r_x3": 176.88, "r_y3": 642.947, "coord_origin": "TOPLEFT"}, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 655.144, "r_x1": 230.993, "r_y1": 655.144, "r_x2": 230.993, "r_y2": 649.389, "r_x3": 176.88, "r_y3": 649.389, "coord_origin": "TOPLEFT"}, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 661.586, "r_x1": 203.932, "r_y1": 661.586, "r_x2": 203.932, "r_y2": 655.831, "r_x3": 176.88, "r_y3": 655.831, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.932, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.563, "r_x3": 215.932, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.057, "r_y0": 569.16, "r_x1": 231.719, "r_y1": 569.16, "r_x2": 231.719, "r_y2": 557.563, "r_x3": 229.057, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.209, "r_y0": 451.197, "r_x1": 263.57, "r_y1": 451.197, "r_x2": 263.57, "r_y2": 448.461, "r_x3": 261.209, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.335, "r_y0": 451.197, "r_x1": 313.636, "r_y1": 451.197, "r_x2": 313.636, "r_y2": 448.461, "r_x3": 312.335, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.411, "r_y0": 451.197, "r_x1": 380.057, "r_y1": 451.197, "r_x2": 380.057, "r_y2": 448.461, "r_x3": 377.411, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 456.076, "r_x1": 205.818, "r_y1": 456.076, "r_x2": 205.818, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.208, "r_y0": 456.076, "r_x1": 229.761, "r_y1": 456.076, "r_x2": 229.761, "r_y2": 453.34, "r_x3": 222.208, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.267, "r_y0": 456.076, "r_x1": 250.82, "r_y1": 456.076, "r_x2": 250.82, "r_y2": 453.34, "r_x3": 243.267, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.297, "r_y0": 456.076, "r_x1": 271.842, "r_y1": 456.076, "r_x2": 271.842, "r_y2": 453.34, "r_x3": 264.297, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.319, "r_y0": 456.076, "r_x1": 292.872, "r_y1": 456.076, "r_x2": 292.872, "r_y2": 453.34, "r_x3": 285.319, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.378, "r_y0": 456.076, "r_x1": 311.766, "r_y1": 456.076, "r_x2": 311.766, "r_y2": 453.34, "r_x3": 306.378, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.417, "r_y0": 456.076, "r_x1": 325.575, "r_y1": 456.076, "r_x2": 325.575, "r_y2": 453.34, "r_x3": 323.417, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.458, "r_y0": 456.076, "r_x1": 336.616, "r_y1": 456.076, "r_x2": 336.616, "r_y2": 453.34, "r_x3": 334.458, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.528, "r_y0": 456.076, "r_x1": 347.685, "r_y1": 456.076, "r_x2": 347.685, "r_y2": 453.34, "r_x3": 345.528, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.569, "r_y0": 456.076, "r_x1": 358.726, "r_y1": 456.076, "r_x2": 358.726, "r_y2": 453.34, "r_x3": 356.569, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.638, "r_y0": 456.076, "r_x1": 371.964, "r_y1": 456.076, "r_x2": 371.964, "r_y2": 453.34, "r_x3": 367.638, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.673, "r_y0": 456.076, "r_x1": 386.999, "r_y1": 456.076, "r_x2": 386.999, "r_y2": 453.34, "r_x3": 382.673, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.737, "r_y0": 456.076, "r_x1": 402.063, "r_y1": 456.076, "r_x2": 402.063, "r_y2": 453.34, "r_x3": 397.737, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 457.8, "r_x1": 414.935, "r_y1": 457.8, "r_x2": 414.935, "r_y2": 447.993, "r_x3": 412.789, "r_y3": 447.993, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.07, "r_y0": 456.076, "r_x1": 422.535, "r_y1": 456.076, "r_x2": 422.535, "r_y2": 453.34, "r_x3": 416.07, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "128", "orig": "128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.563, "r_y1": 466.66, "r_x2": 204.563, "r_y2": 463.924, "r_x3": 200.64, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.924, "r_x3": 367.626, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 466.66, "r_x1": 384.616, "r_y1": 466.66, "r_x2": 384.616, "r_y2": 463.924, "r_x3": 382.661, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 466.66, "r_x1": 399.679, "r_y1": 466.66, "r_x2": 399.679, "r_y2": 463.924, "r_x3": 397.725, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 471.539, "r_x1": 206.503, "r_y1": 471.539, "r_x2": 206.503, "r_y2": 468.803, "r_x3": 200.64, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 471.539, "r_x1": 266.245, "r_y1": 471.539, "r_x2": 266.245, "r_y2": 468.803, "r_x3": 264.29, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.372, "r_y0": 471.539, "r_x1": 308.326, "r_y1": 471.539, "r_x2": 308.326, "r_y2": 468.803, "r_x3": 306.372, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.515, "r_y0": 471.539, "r_x1": 347.47, "r_y1": 471.539, "r_x2": 347.47, "r_y2": 468.803, "r_x3": 345.515, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.556, "r_y0": 471.539, "r_x1": 358.511, "r_y1": 471.539, "r_x2": 358.511, "r_y2": 468.803, "r_x3": 356.556, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 471.539, "r_x1": 369.58, "r_y1": 471.539, "r_x2": 369.58, "r_y2": 468.803, "r_x3": 367.626, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 471.539, "r_x1": 384.615, "r_y1": 471.539, "r_x2": 384.615, "r_y2": 468.803, "r_x3": 382.661, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 476.418, "r_x1": 206.503, "r_y1": 476.418, "r_x2": 206.503, "r_y2": 473.682, "r_x3": 200.64, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 476.418, "r_x1": 266.245, "r_y1": 476.418, "r_x2": 266.245, "r_y2": 473.682, "r_x3": 264.29, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 481.268, "r_x1": 206.503, "r_y1": 481.268, "r_x2": 206.503, "r_y2": 478.532, "r_x3": 200.64, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.264, "r_y0": 481.268, "r_x1": 245.218, "r_y1": 481.268, "r_x2": 245.218, "r_y2": 478.532, "r_x3": 243.264, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 481.268, "r_x1": 266.245, "r_y1": 481.268, "r_x2": 266.245, "r_y2": 478.532, "r_x3": 264.29, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.405, "r_y0": 481.268, "r_x1": 325.359, "r_y1": 481.268, "r_x2": 325.359, "r_y2": 478.532, "r_x3": 323.405, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 481.268, "r_x1": 399.679, "r_y1": 481.268, "r_x2": 399.679, "r_y2": 478.532, "r_x3": 397.725, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 486.147, "r_x1": 206.503, "r_y1": 486.147, "r_x2": 206.503, "r_y2": 483.411, "r_x3": 200.64, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 486.147, "r_x1": 384.616, "r_y1": 486.147, "r_x2": 384.616, "r_y2": 483.411, "r_x3": 382.661, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 486.147, "r_x1": 401.648, "r_y1": 486.147, "r_x2": 401.648, "r_y2": 483.411, "r_x3": 397.725, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 486.147, "r_x1": 414.744, "r_y1": 486.147, "r_x2": 414.744, "r_y2": 483.411, "r_x3": 412.789, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 491.026, "r_x1": 207.134, "r_y1": 491.026, "r_x2": 207.134, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 491.026, "r_x1": 369.784, "r_y1": 491.026, "r_x2": 369.784, "r_y2": 488.29, "r_x3": 367.626, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 491.026, "r_x1": 384.819, "r_y1": 491.026, "r_x2": 384.819, "r_y2": 488.29, "r_x3": 382.661, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 491.026, "r_x1": 402.051, "r_y1": 491.026, "r_x2": 402.051, "r_y2": 488.29, "r_x3": 397.725, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 495.904, "r_x1": 208.472, "r_y1": 495.904, "r_x2": 208.472, "r_y2": 493.168, "r_x3": 200.64, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 495.904, "r_x1": 266.245, "r_y1": 495.904, "r_x2": 266.245, "r_y2": 493.168, "r_x3": 264.29, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 58, "label": "text", "bbox": {"l": 180.125, "t": 516.296, "r": 190.62, "b": 518.934, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 518.934, "r_x1": 190.62, "r_y1": 518.934, "r_x2": 190.62, "r_y2": 516.296, "r_x3": 180.125, "r_y3": 516.296, "coord_origin": "TOPLEFT"}, "text": "<table>", "orig": "<table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 183.244, "t": 520.194, "r": 304.548, "b": 522.8330000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 522.8330000000001, "r_x1": 304.548, "r_y1": 522.8330000000001, "r_x2": 304.548, "r_y2": 520.194, "r_x3": 183.244, "r_y3": 520.194, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "orig": "<tr><td></td><td colspan=\"4\"></td><td colspan=\"6\"></td><td colspan=\"3\"></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 183.244, "t": 524.0930000000001, "r": 388.423, "b": 526.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 526.731, "r_x1": 388.423, "r_y1": 526.731, "r_x2": 388.423, "r_y2": 524.0930000000001, "r_x3": 183.244, "r_y3": 524.0930000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 183.244, "t": 527.992, "r": 388.423, "b": 530.63, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 530.63, "r_x1": 388.423, "r_y1": 530.63, "r_x2": 388.423, "r_y2": 527.992, "r_x3": 183.244, "r_y3": 527.992, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 183.244, "t": 531.8910000000001, "r": 388.423, "b": 534.529, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 534.529, "r_x1": 388.423, "r_y1": 534.529, "r_x2": 388.423, "r_y2": 531.8910000000001, "r_x3": 183.244, "r_y3": 531.8910000000001, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 183.244, "t": 535.79, "r": 388.423, "b": 538.428, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 538.428, "r_x1": 388.423, "r_y1": 538.428, "r_x2": 388.423, "r_y2": 535.79, "r_x3": 183.244, "r_y3": 535.79, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 183.244, "t": 539.689, "r": 388.423, "b": 542.327, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 542.327, "r_x1": 388.423, "r_y1": 542.327, "r_x2": 388.423, "r_y2": 539.689, "r_x3": 183.244, "r_y3": 539.689, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 183.244, "t": 543.588, "r": 388.423, "b": 546.226, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 546.226, "r_x1": 388.423, "r_y1": 546.226, "r_x2": 388.423, "r_y2": 543.588, "r_x3": 183.244, "r_y3": 543.588, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 183.244, "t": 547.486, "r": 388.423, "b": 550.124, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 550.124, "r_x1": 388.423, "r_y1": 550.124, "r_x2": 388.423, "r_y2": 547.486, "r_x3": 183.244, "r_y3": 547.486, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 183.244, "t": 551.385, "r": 388.423, "b": 554.023, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.244, "r_y0": 554.023, "r_x1": 388.423, "r_y1": 554.023, "r_x2": 388.423, "r_y2": 551.385, "r_x3": 183.244, "r_y3": 551.385, "coord_origin": "TOPLEFT"}, "text": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "orig": "<tr><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td><td></td></tr>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 180.125, "t": 555.284, "r": 191.868, "b": 557.922, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.125, "r_y0": 557.922, "r_x1": 191.868, "r_y1": 557.922, "r_x2": 191.868, "r_y2": 555.284, "r_x3": 180.125, "r_y3": 555.284, "coord_origin": "TOPLEFT"}, "text": "</table>", "orig": "</table>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 407.383, "t": 518.363, "r": 450.486, "b": 521.001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 521.001, "r_x1": 450.486, "r_y1": 521.001, "r_x2": 450.486, "r_y2": 518.363, "r_x3": 407.383, "r_y3": 518.363, "coord_origin": "TOPLEFT"}, "text": "C C L L L C L L L L L C L L NL", "orig": "C C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 407.383, "t": 522.262, "r": 450.486, "b": 524.9, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 524.9, "r_x1": 450.486, "r_y1": 524.9, "r_x2": 450.486, "r_y2": 522.262, "r_x3": 407.383, "r_y3": 522.262, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 407.383, "t": 526.1600000000001, "r": 450.486, "b": 528.799, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 528.799, "r_x1": 450.486, "r_y1": 528.799, "r_x2": 450.486, "r_y2": 526.1600000000001, "r_x3": 407.383, "r_y3": 526.1600000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 407.383, "t": 530.059, "r": 450.486, "b": 532.697, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 532.697, "r_x1": 450.486, "r_y1": 532.697, "r_x2": 450.486, "r_y2": 530.059, "r_x3": 407.383, "r_y3": 530.059, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 407.383, "t": 533.9580000000001, "r": 450.486, "b": 536.596, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 536.596, "r_x1": 450.486, "r_y1": 536.596, "r_x2": 450.486, "r_y2": 533.9580000000001, "r_x3": 407.383, "r_y3": 533.9580000000001, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 407.383, "t": 537.857, "r": 450.486, "b": 540.495, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 540.495, "r_x1": 450.486, "r_y1": 540.495, "r_x2": 450.486, "r_y2": 537.857, "r_x3": 407.383, "r_y3": 537.857, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 407.383, "t": 541.756, "r": 450.486, "b": 544.394, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 544.394, "r_x1": 450.486, "r_y1": 544.394, "r_x2": 450.486, "r_y2": 541.756, "r_x3": 407.383, "r_y3": 541.756, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 407.383, "t": 545.655, "r": 450.486, "b": 548.293, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 548.293, "r_x1": 450.486, "r_y1": 548.293, "r_x2": 450.486, "r_y2": 545.655, "r_x3": 407.383, "r_y3": 545.655, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 407.383, "t": 549.554, "r": 450.486, "b": 552.192, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.383, "r_y0": 552.192, "r_x1": 450.486, "r_y1": 552.192, "r_x2": 450.486, "r_y2": 549.554, "r_x3": 407.383, "r_y3": 549.554, "coord_origin": "TOPLEFT"}, "text": "C C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 164.529, "t": 509.533, "r": 181.853, "b": 515.288, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.529, "r_y0": 515.288, "r_x1": 181.853, "r_y1": 515.288, "r_x2": 181.853, "r_y2": 509.533, "r_x3": 164.529, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 183.584, "t": 509.533, "r": 208.901, "b": 515.288, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.584, "r_y0": 515.288, "r_x1": 208.901, "r_y1": 515.288, "r_x2": 208.901, "r_y2": 509.533, "r_x3": 183.584, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 210.633, "t": 509.533, "r": 221.04, "b": 515.288, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 515.288, "r_x1": 221.04, "r_y1": 515.288, "r_x2": 221.04, "r_y2": 509.533, "r_x3": 210.633, "r_y3": 509.533, "coord_origin": "TOPLEFT"}, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 390.202, "t": 509.678, "r": 406.836, "b": 515.433, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.202, "r_y0": 515.433, "r_x1": 406.836, "r_y1": 515.433, "r_x2": 406.836, "r_y2": 509.678, "r_x3": 390.202, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 408.569, "t": 509.678, "r": 433.886, "b": 515.433, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.569, "r_y0": 515.433, "r_x1": 433.886, "r_y1": 515.433, "r_x2": 433.886, "r_y2": 509.678, "r_x3": 408.569, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "# tokens:", "orig": "# tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 435.617, "t": 509.678, "r": 446.025, "b": 515.433, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.617, "r_y0": 515.433, "r_x1": 446.025, "r_y1": 515.433, "r_x2": 446.025, "r_y2": 509.678, "r_x3": 435.617, "r_y3": 509.678, "coord_origin": "TOPLEFT"}, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 167.193, "t": 519.1659999999999, "r": 172.823, "b": 526.36, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.193, "r_y0": 526.36, "r_x1": 172.823, "r_y1": 526.36, "r_x2": 172.823, "r_y2": 519.1659999999999, "r_x3": 167.193, "r_y3": 519.1659999999999, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 187.337, "t": 448.718, "r": 192.967, "b": 455.912, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.337, "r_y0": 455.912, "r_x1": 192.967, "r_y1": 455.912, "r_x2": 192.967, "r_y2": 448.718, "r_x3": 187.337, "r_y3": 448.718, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 167.387, "t": 566.0989999999999, "r": 173.016, "b": 573.292, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.387, "r_y0": 573.292, "r_x1": 173.016, "r_y1": 573.292, "r_x2": 173.016, "r_y2": 566.0989999999999, "r_x3": 167.387, "r_y3": 566.0989999999999, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 248.456, "t": 621.874, "r": 253.657, "b": 629.067, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.456, "r_y0": 629.067, "r_x1": 253.657, "r_y1": 629.067, "r_x2": 253.657, "r_y2": 621.874, "r_x3": 248.456, "r_y3": 621.874, "coord_origin": "TOPLEFT"}, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 395.901, "t": 519.293, "r": 401.531, "b": 526.4870000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.901, "r_y0": 526.4870000000001, "r_x1": 401.531, "r_y1": 526.4870000000001, "r_x2": 401.531, "r_y2": 519.293, "r_x3": 395.901, "r_y3": 519.293, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 171.7, "t": 580.287, "r": 177.46, "b": 597.269, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.46, "r_y0": 597.268, "r_x1": 177.455, "r_y1": 580.287, "r_x2": 171.7, "r_y2": 580.289, "r_x3": 171.705, "r_y3": 597.269, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 251.131, "t": 633.633, "r": 256.891, "b": 649.925, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.891, "r_y0": 649.923, "r_x1": 256.886, "r_y1": 633.633, "r_x2": 251.131, "r_y2": 633.634, "r_x3": 251.136, "r_y3": 649.925, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 372.146, "t": 601.532, "r": 427.038, "b": 607.287, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 607.287, "r_x1": 427.038, "r_y1": 607.287, "r_x2": 427.038, "r_y2": 601.532, "r_x3": 372.146, "r_y3": 601.532, "coord_origin": "TOPLEFT"}, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 372.146, "t": 607.9739999999999, "r": 430.068, "b": 613.729, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 372.146, "r_y0": 613.729, "r_x1": 430.068, "r_y1": 613.729, "r_x2": 430.068, "r_y2": 607.9739999999999, "r_x3": 372.146, "r_y3": 607.9739999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 176.88, "t": 642.947, "r": 231.082, "b": 648.702, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 648.702, "r_x1": 231.082, "r_y1": 648.702, "r_x2": 231.082, "r_y2": 642.947, "r_x3": 176.88, "r_y3": 642.947, "coord_origin": "TOPLEFT"}, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 176.88, "t": 649.389, "r": 230.993, "b": 655.144, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 655.144, "r_x1": 230.993, "r_y1": 655.144, "r_x2": 230.993, "r_y2": 649.389, "r_x3": 176.88, "r_y3": 649.389, "coord_origin": "TOPLEFT"}, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 176.88, "t": 655.831, "r": 203.932, "b": 661.586, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.88, "r_y0": 661.586, "r_x1": 203.932, "r_y1": 661.586, "r_x2": 203.932, "r_y2": 655.831, "r_x3": 176.88, "r_y3": 655.831, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 215.932, "t": 557.563, "r": 218.47, "b": 569.16, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.932, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.563, "r_x3": 215.932, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 229.057, "t": 557.563, "r": 231.719, "b": 569.16, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.057, "r_y0": 569.16, "r_x1": 231.719, "r_y1": 569.16, "r_x2": 231.719, "r_y2": 557.563, "r_x3": 229.057, "r_y3": 557.563, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 261.209, "t": 448.461, "r": 263.57, "b": 451.197, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.209, "r_y0": 451.197, "r_x1": 263.57, "r_y1": 451.197, "r_x2": 263.57, "r_y2": 448.461, "r_x3": 261.209, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 312.335, "t": 448.461, "r": 313.636, "b": 451.197, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.335, "r_y0": 451.197, "r_x1": 313.636, "r_y1": 451.197, "r_x2": 313.636, "r_y2": 448.461, "r_x3": 312.335, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 377.411, "t": 448.461, "r": 380.057, "b": 451.197, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.411, "r_y0": 451.197, "r_x1": 380.057, "r_y1": 451.197, "r_x2": 380.057, "r_y2": 448.461, "r_x3": 377.411, "r_y3": 448.461, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 200.64, "t": 453.34, "r": 205.818, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 456.076, "r_x1": 205.818, "r_y1": 456.076, "r_x2": 205.818, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 222.208, "t": 453.34, "r": 229.761, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.208, "r_y0": 456.076, "r_x1": 229.761, "r_y1": 456.076, "r_x2": 229.761, "r_y2": 453.34, "r_x3": 222.208, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 243.267, "t": 453.34, "r": 250.82, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.267, "r_y0": 456.076, "r_x1": 250.82, "r_y1": 456.076, "r_x2": 250.82, "r_y2": 453.34, "r_x3": 243.267, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 264.297, "t": 453.34, "r": 271.842, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.297, "r_y0": 456.076, "r_x1": 271.842, "r_y1": 456.076, "r_x2": 271.842, "r_y2": 453.34, "r_x3": 264.297, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 285.319, "t": 453.34, "r": 292.872, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.319, "r_y0": 456.076, "r_x1": 292.872, "r_y1": 456.076, "r_x2": 292.872, "r_y2": 453.34, "r_x3": 285.319, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 306.378, "t": 453.34, "r": 311.766, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.378, "r_y0": 456.076, "r_x1": 311.766, "r_y1": 456.076, "r_x2": 311.766, "r_y2": 453.34, "r_x3": 306.378, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 323.417, "t": 453.34, "r": 325.575, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.417, "r_y0": 456.076, "r_x1": 325.575, "r_y1": 456.076, "r_x2": 325.575, "r_y2": 453.34, "r_x3": 323.417, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 334.458, "t": 453.34, "r": 336.616, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.458, "r_y0": 456.076, "r_x1": 336.616, "r_y1": 456.076, "r_x2": 336.616, "r_y2": 453.34, "r_x3": 334.458, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 345.528, "t": 453.34, "r": 347.685, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.528, "r_y0": 456.076, "r_x1": 347.685, "r_y1": 456.076, "r_x2": 347.685, "r_y2": 453.34, "r_x3": 345.528, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 356.569, "t": 453.34, "r": 358.726, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.569, "r_y0": 456.076, "r_x1": 358.726, "r_y1": 456.076, "r_x2": 358.726, "r_y2": 453.34, "r_x3": 356.569, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 367.638, "t": 453.34, "r": 371.964, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.638, "r_y0": 456.076, "r_x1": 371.964, "r_y1": 456.076, "r_x2": 371.964, "r_y2": 453.34, "r_x3": 367.638, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 382.673, "t": 453.34, "r": 386.999, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.673, "r_y0": 456.076, "r_x1": 386.999, "r_y1": 456.076, "r_x2": 386.999, "r_y2": 453.34, "r_x3": 382.673, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 397.737, "t": 453.34, "r": 402.063, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.737, "r_y0": 456.076, "r_x1": 402.063, "r_y1": 456.076, "r_x2": 402.063, "r_y2": 453.34, "r_x3": 397.737, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 412.789, "t": 447.993, "r": 414.935, "b": 457.8, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 457.8, "r_x1": 414.935, "r_y1": 457.8, "r_x2": 414.935, "r_y2": 447.993, "r_x3": 412.789, "r_y3": 447.993, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 416.07, "t": 453.34, "r": 422.535, "b": 456.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.07, "r_y0": 456.076, "r_x1": 422.535, "r_y1": 456.076, "r_x2": 422.535, "r_y2": 453.34, "r_x3": 416.07, "r_y3": 453.34, "coord_origin": "TOPLEFT"}, "text": "128", "orig": "128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 200.64, "t": 463.924, "r": 204.563, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.563, "r_y1": 466.66, "r_x2": 204.563, "r_y2": 463.924, "r_x3": 200.64, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 367.626, "t": 463.924, "r": 369.58, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.924, "r_x3": 367.626, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 382.661, "t": 463.924, "r": 384.616, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 466.66, "r_x1": 384.616, "r_y1": 466.66, "r_x2": 384.616, "r_y2": 463.924, "r_x3": 382.661, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 397.725, "t": 463.924, "r": 399.679, "b": 466.66, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 466.66, "r_x1": 399.679, "r_y1": 466.66, "r_x2": 399.679, "r_y2": 463.924, "r_x3": 397.725, "r_y3": 463.924, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 200.64, "t": 468.803, "r": 206.503, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 471.539, "r_x1": 206.503, "r_y1": 471.539, "r_x2": 206.503, "r_y2": 468.803, "r_x3": 200.64, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 264.29, "t": 468.803, "r": 266.245, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 471.539, "r_x1": 266.245, "r_y1": 471.539, "r_x2": 266.245, "r_y2": 468.803, "r_x3": 264.29, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 306.372, "t": 468.803, "r": 308.326, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.372, "r_y0": 471.539, "r_x1": 308.326, "r_y1": 471.539, "r_x2": 308.326, "r_y2": 468.803, "r_x3": 306.372, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 345.515, "t": 468.803, "r": 347.47, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.515, "r_y0": 471.539, "r_x1": 347.47, "r_y1": 471.539, "r_x2": 347.47, "r_y2": 468.803, "r_x3": 345.515, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 124, "label": "text", "bbox": {"l": 356.556, "t": 468.803, "r": 358.511, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.556, "r_y0": 471.539, "r_x1": 358.511, "r_y1": 471.539, "r_x2": 358.511, "r_y2": 468.803, "r_x3": 356.556, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 367.626, "t": 468.803, "r": 369.58, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 471.539, "r_x1": 369.58, "r_y1": 471.539, "r_x2": 369.58, "r_y2": 468.803, "r_x3": 367.626, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 382.661, "t": 468.803, "r": 384.615, "b": 471.539, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 471.539, "r_x1": 384.615, "r_y1": 471.539, "r_x2": 384.615, "r_y2": 468.803, "r_x3": 382.661, "r_y3": 468.803, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 200.64, "t": 473.682, "r": 206.503, "b": 476.418, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 476.418, "r_x1": 206.503, "r_y1": 476.418, "r_x2": 206.503, "r_y2": 473.682, "r_x3": 200.64, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 128, "label": "text", "bbox": {"l": 264.29, "t": 473.682, "r": 266.245, "b": 476.418, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 476.418, "r_x1": 266.245, "r_y1": 476.418, "r_x2": 266.245, "r_y2": 473.682, "r_x3": 264.29, "r_y3": 473.682, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 129, "label": "text", "bbox": {"l": 200.64, "t": 478.532, "r": 206.503, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 481.268, "r_x1": 206.503, "r_y1": 481.268, "r_x2": 206.503, "r_y2": 478.532, "r_x3": 200.64, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 130, "label": "text", "bbox": {"l": 243.264, "t": 478.532, "r": 245.218, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.264, "r_y0": 481.268, "r_x1": 245.218, "r_y1": 481.268, "r_x2": 245.218, "r_y2": 478.532, "r_x3": 243.264, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 131, "label": "text", "bbox": {"l": 264.29, "t": 478.532, "r": 266.245, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 481.268, "r_x1": 266.245, "r_y1": 481.268, "r_x2": 266.245, "r_y2": 478.532, "r_x3": 264.29, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 132, "label": "text", "bbox": {"l": 323.405, "t": 478.532, "r": 325.359, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.405, "r_y0": 481.268, "r_x1": 325.359, "r_y1": 481.268, "r_x2": 325.359, "r_y2": 478.532, "r_x3": 323.405, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 133, "label": "text", "bbox": {"l": 397.725, "t": 478.532, "r": 399.679, "b": 481.268, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 481.268, "r_x1": 399.679, "r_y1": 481.268, "r_x2": 399.679, "r_y2": 478.532, "r_x3": 397.725, "r_y3": 478.532, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 134, "label": "text", "bbox": {"l": 200.64, "t": 483.411, "r": 206.503, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 486.147, "r_x1": 206.503, "r_y1": 486.147, "r_x2": 206.503, "r_y2": 483.411, "r_x3": 200.64, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 135, "label": "text", "bbox": {"l": 382.661, "t": 483.411, "r": 384.616, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 486.147, "r_x1": 384.616, "r_y1": 486.147, "r_x2": 384.616, "r_y2": 483.411, "r_x3": 382.661, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 136, "label": "text", "bbox": {"l": 397.725, "t": 483.411, "r": 401.648, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 486.147, "r_x1": 401.648, "r_y1": 486.147, "r_x2": 401.648, "r_y2": 483.411, "r_x3": 397.725, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 137, "label": "text", "bbox": {"l": 412.789, "t": 483.411, "r": 414.744, "b": 486.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.789, "r_y0": 486.147, "r_x1": 414.744, "r_y1": 486.147, "r_x2": 414.744, "r_y2": 483.411, "r_x3": 412.789, "r_y3": 483.411, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 138, "label": "text", "bbox": {"l": 200.64, "t": 488.29, "r": 207.134, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 491.026, "r_x1": 207.134, "r_y1": 491.026, "r_x2": 207.134, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 139, "label": "text", "bbox": {"l": 367.626, "t": 488.29, "r": 369.784, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.626, "r_y0": 491.026, "r_x1": 369.784, "r_y1": 491.026, "r_x2": 369.784, "r_y2": 488.29, "r_x3": 367.626, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 140, "label": "text", "bbox": {"l": 382.661, "t": 488.29, "r": 384.819, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.661, "r_y0": 491.026, "r_x1": 384.819, "r_y1": 491.026, "r_x2": 384.819, "r_y2": 488.29, "r_x3": 382.661, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 141, "label": "text", "bbox": {"l": 397.725, "t": 488.29, "r": 402.051, "b": 491.026, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 397.725, "r_y0": 491.026, "r_x1": 402.051, "r_y1": 491.026, "r_x2": 402.051, "r_y2": 488.29, "r_x3": 397.725, "r_y3": 488.29, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 142, "label": "text", "bbox": {"l": 200.64, "t": 493.168, "r": 208.472, "b": 495.904, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.64, "r_y0": 495.904, "r_x1": 208.472, "r_y1": 495.904, "r_x2": 208.472, "r_y2": 493.168, "r_x3": 200.64, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 143, "label": "text", "bbox": {"l": 264.29, "t": 493.168, "r": 266.245, "b": 495.904, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.29, "r_y0": 495.904, "r_x1": 266.245, "r_y1": 495.904, "r_x2": 266.245, "r_y2": 493.168, "r_x3": 264.29, "r_y3": 493.168, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "text", "id": 144, "page_no": 9, "cluster": {"id": 144, "label": "text", "bbox": {"l": 227.915, "t": 665.826, "r": 230.1, "b": 675.346, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.915, "r_y0": 675.346, "r_x1": 230.1, "r_y1": 675.346, "r_x2": 230.1, "r_y2": 665.826, "r_x3": 227.915, "r_y3": 665.826, "coord_origin": "TOPLEFT"}, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u03bc"}, {"label": "text", "id": 145, "page_no": 9, "cluster": {"id": 145, "label": "text", "bbox": {"l": 300.581, "t": 683.622, "r": 302.726, "b": 693.429, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 300.581, "r_y0": 693.429, "r_x1": 302.726, "r_y1": 693.429, "r_x2": 302.726, "r_y2": 683.622, "r_x3": 300.581, "r_y3": 683.622, "coord_origin": "TOPLEFT"}, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u2265"}], "headers": [{"label": "page_header", "id": 7, "page_no": 9, "cluster": {"id": 7, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 143.979, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8309906721115112, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "10"}, {"label": "page_header", "id": 6, "page_no": 9, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 167.821, "t": 91.49300000000005, "r": 231.72, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8367075324058533, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}]}}, {"page_no": 10, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.376, "r_y0": 102.78200000000004, "r_x1": 480.59, "r_y1": 102.78200000000004, "r_x2": 480.59, "r_y2": 91.49300000000005, "r_x3": 471.376, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 133.72500000000002, "r_x1": 162.644, "r_y1": 133.72500000000002, "r_x2": 162.644, "r_y2": 125.79899999999998, "r_x3": 134.765, "r_y3": 125.79899999999998, "coord_origin": "TOPLEFT"}, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.215, "r_y0": 134.87300000000005, "r_x1": 480.587, "r_y1": 134.87300000000005, "r_x2": 480.587, "r_y2": 123.58399999999995, "r_x3": 165.215, "r_y3": 123.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 145.832, "r_x1": 480.588, "r_y1": 145.832, "r_x2": 480.588, "r_y2": 134.543, "r_x3": 134.765, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 156.79100000000005, "r_x1": 480.588, "r_y1": 156.79100000000005, "r_x2": 480.588, "r_y2": 145.50199999999995, "r_x3": 134.765, "r_y3": 145.50199999999995, "coord_origin": "TOPLEFT"}, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 167.75, "r_x1": 480.588, "r_y1": 167.75, "r_x2": 480.588, "r_y2": 156.461, "r_x3": 134.765, "r_y3": 156.461, "coord_origin": "TOPLEFT"}, "text": "didn't complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn't complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 178.70899999999995, "r_x1": 415.845, "r_y1": 178.70899999999995, "r_x2": 415.845, "r_y2": 167.41999999999996, "r_x3": 134.765, "r_y3": 167.41999999999996, "coord_origin": "TOPLEFT"}, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.505, "r_y0": 320.335, "r_x1": 177.596, "r_y1": 320.335, "r_x2": 177.596, "r_y2": 312.552, "r_x3": 171.505, "r_y3": 312.552, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.058, "r_y0": 500.537, "r_x1": 177.149, "r_y1": 500.537, "r_x2": 177.149, "r_y2": 492.754, "r_x3": 171.058, "r_y3": 492.754, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 633.395, "r_x1": 374.963, "r_y1": 633.395, "r_x2": 374.963, "r_y2": 627.558, "r_x3": 283.047, "r_y3": 627.558, "coord_origin": "TOPLEFT"}, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 623.271, "r_x1": 398.06, "r_y1": 623.271, "r_x2": 398.06, "r_y2": 617.434, "r_x3": 283.047, "r_y3": 617.434, "coord_origin": "TOPLEFT"}, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.642, "r_y0": 471.511, "r_x1": 437.508, "r_y1": 471.511, "r_x2": 437.508, "r_y2": 465.674, "r_x3": 293.642, "r_y3": 465.674, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 294.273, "r_x1": 239.235, "r_y1": 294.273, "r_x2": 239.235, "r_y2": 288.436, "r_x3": 181.891, "r_y3": 288.436, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 300.807, "r_x1": 251.529, "r_y1": 300.807, "r_x2": 251.529, "r_y2": 294.97, "r_x3": 181.891, "r_y3": 294.97, "coord_origin": "TOPLEFT"}, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.834, "r_y0": 194.32600000000002, "r_x1": 253.613, "r_y1": 194.32600000000002, "r_x2": 253.613, "r_y2": 186.962, "r_x3": 247.834, "r_y3": 186.962, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.19, "r_y0": 613.719, "r_x1": 381.547, "r_y1": 613.719, "r_x2": 381.547, "r_y2": 607.8820000000001, "r_x3": 292.19, "r_y3": 607.8820000000001, "coord_origin": "TOPLEFT"}, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 403.401, "r_x1": 180.173, "r_y1": 381.368, "r_x2": 172.39, "r_y2": 381.363, "r_x3": 172.374, "r_y3": 403.395, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 578.748, "r_x1": 180.174, "r_y1": 555.783, "r_x2": 172.391, "r_y2": 555.777, "r_x3": 172.374, "r_y3": 578.742, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 0, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9301655888557434, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "page_header", "bbox": {"l": 471.376, "t": 91.49300000000005, "r": 480.59, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9007201790809631, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.376, "r_y0": 102.78200000000004, "r_x1": 480.59, "r_y1": 102.78200000000004, "r_x2": 480.59, "r_y2": 91.49300000000005, "r_x3": 471.376, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "caption", "bbox": {"l": 134.765, "t": 123.58399999999995, "r": 480.588, "b": 178.70899999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.8657060861587524, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 133.72500000000002, "r_x1": 162.644, "r_y1": 133.72500000000002, "r_x2": 162.644, "r_y2": 125.79899999999998, "r_x3": 134.765, "r_y3": 125.79899999999998, "coord_origin": "TOPLEFT"}, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.215, "r_y0": 134.87300000000005, "r_x1": 480.587, "r_y1": 134.87300000000005, "r_x2": 480.587, "r_y2": 123.58399999999995, "r_x3": 165.215, "r_y3": 123.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 145.832, "r_x1": 480.588, "r_y1": 145.832, "r_x2": 480.588, "r_y2": 134.543, "r_x3": 134.765, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 156.79100000000005, "r_x1": 480.588, "r_y1": 156.79100000000005, "r_x2": 480.588, "r_y2": 145.50199999999995, "r_x3": 134.765, "r_y3": 145.50199999999995, "coord_origin": "TOPLEFT"}, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 167.75, "r_x1": 480.588, "r_y1": 167.75, "r_x2": 480.588, "r_y2": 156.461, "r_x3": 134.765, "r_y3": 156.461, "coord_origin": "TOPLEFT"}, "text": "didn't complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn't complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 178.70899999999995, "r_x1": 415.845, "r_y1": 178.70899999999995, "r_x2": 415.845, "r_y2": 167.41999999999996, "r_x3": 134.765, "r_y3": 167.41999999999996, "coord_origin": "TOPLEFT"}, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "picture", "bbox": {"l": 168.39285278320312, "t": 181.9665069580078, "r": 447.35137939453125, "b": 634.0056762695312, "coord_origin": "TOPLEFT"}, "confidence": 0.7612658739089966, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.505, "r_y0": 320.335, "r_x1": 177.596, "r_y1": 320.335, "r_x2": 177.596, "r_y2": 312.552, "r_x3": 171.505, "r_y3": 312.552, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.058, "r_y0": 500.537, "r_x1": 177.149, "r_y1": 500.537, "r_x2": 177.149, "r_y2": 492.754, "r_x3": 171.058, "r_y3": 492.754, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 633.395, "r_x1": 374.963, "r_y1": 633.395, "r_x2": 374.963, "r_y2": 627.558, "r_x3": 283.047, "r_y3": 627.558, "coord_origin": "TOPLEFT"}, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 623.271, "r_x1": 398.06, "r_y1": 623.271, "r_x2": 398.06, "r_y2": 617.434, "r_x3": 283.047, "r_y3": 617.434, "coord_origin": "TOPLEFT"}, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.642, "r_y0": 471.511, "r_x1": 437.508, "r_y1": 471.511, "r_x2": 437.508, "r_y2": 465.674, "r_x3": 293.642, "r_y3": 465.674, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 294.273, "r_x1": 239.235, "r_y1": 294.273, "r_x2": 239.235, "r_y2": 288.436, "r_x3": 181.891, "r_y3": 288.436, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 300.807, "r_x1": 251.529, "r_y1": 300.807, "r_x2": 251.529, "r_y2": 294.97, "r_x3": 181.891, "r_y3": 294.97, "coord_origin": "TOPLEFT"}, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.834, "r_y0": 194.32600000000002, "r_x1": 253.613, "r_y1": 194.32600000000002, "r_x2": 253.613, "r_y2": 186.962, "r_x3": 247.834, "r_y3": 186.962, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.19, "r_y0": 613.719, "r_x1": 381.547, "r_y1": 613.719, "r_x2": 381.547, "r_y2": 607.8820000000001, "r_x3": 292.19, "r_y3": 607.8820000000001, "coord_origin": "TOPLEFT"}, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 403.401, "r_x1": 180.173, "r_y1": 381.368, "r_x2": 172.39, "r_y2": 381.363, "r_x3": 172.374, "r_y3": 403.395, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 578.748, "r_x1": 180.174, "r_y1": 555.783, "r_x2": 172.391, "r_y2": 555.777, "r_x3": 172.374, "r_y3": 578.742, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 18, "label": "text", "bbox": {"l": 171.505, "t": 312.552, "r": 177.596, "b": 320.335, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.505, "r_y0": 320.335, "r_x1": 177.596, "r_y1": 320.335, "r_x2": 177.596, "r_y2": 312.552, "r_x3": 171.505, "r_y3": 312.552, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 171.058, "t": 492.754, "r": 177.149, "b": 500.537, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.058, "r_y0": 500.537, "r_x1": 177.149, "r_y1": 500.537, "r_x2": 177.149, "r_y2": 492.754, "r_x3": 171.058, "r_y3": 492.754, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 283.047, "t": 627.558, "r": 374.963, "b": 633.395, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 633.395, "r_x1": 374.963, "r_y1": 633.395, "r_x2": 374.963, "r_y2": 627.558, "r_x3": 283.047, "r_y3": 627.558, "coord_origin": "TOPLEFT"}, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 283.047, "t": 617.434, "r": 398.06, "b": 623.271, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 623.271, "r_x1": 398.06, "r_y1": 623.271, "r_x2": 398.06, "r_y2": 617.434, "r_x3": 283.047, "r_y3": 617.434, "coord_origin": "TOPLEFT"}, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 293.642, "t": 465.674, "r": 437.508, "b": 471.511, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.642, "r_y0": 471.511, "r_x1": 437.508, "r_y1": 471.511, "r_x2": 437.508, "r_y2": 465.674, "r_x3": 293.642, "r_y3": 465.674, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 181.891, "t": 288.436, "r": 239.235, "b": 294.273, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 294.273, "r_x1": 239.235, "r_y1": 294.273, "r_x2": 239.235, "r_y2": 288.436, "r_x3": 181.891, "r_y3": 288.436, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 181.891, "t": 294.97, "r": 251.529, "b": 300.807, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 300.807, "r_x1": 251.529, "r_y1": 300.807, "r_x2": 251.529, "r_y2": 294.97, "r_x3": 181.891, "r_y3": 294.97, "coord_origin": "TOPLEFT"}, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 247.834, "t": 186.962, "r": 253.613, "b": 194.32600000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.834, "r_y0": 194.32600000000002, "r_x1": 253.613, "r_y1": 194.32600000000002, "r_x2": 253.613, "r_y2": 186.962, "r_x3": 247.834, "r_y3": 186.962, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 292.19, "t": 607.8820000000001, "r": 381.547, "b": 613.719, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.19, "r_y0": 613.719, "r_x1": 381.547, "r_y1": 613.719, "r_x2": 381.547, "r_y2": 607.8820000000001, "r_x3": 292.19, "r_y3": 607.8820000000001, "coord_origin": "TOPLEFT"}, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 172.374, "t": 381.363, "r": 180.173, "b": 403.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 403.401, "r_x1": 180.173, "r_y1": 381.368, "r_x2": 172.39, "r_y2": 381.363, "r_x3": 172.374, "r_y3": 403.395, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 172.374, "t": 555.777, "r": 180.174, "b": 578.748, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 578.748, "r_x1": 180.174, "r_y1": 555.783, "r_x2": 172.391, "r_y2": 555.777, "r_x3": 172.374, "r_y3": 578.742, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 0, "page_no": 10, "cluster": {"id": 0, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9301655888557434, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 1, "page_no": 10, "cluster": {"id": 1, "label": "page_header", "bbox": {"l": 471.376, "t": 91.49300000000005, "r": 480.59, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9007201790809631, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.376, "r_y0": 102.78200000000004, "r_x1": 480.59, "r_y1": 102.78200000000004, "r_x2": 480.59, "r_y2": 91.49300000000005, "r_x3": 471.376, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "11"}, {"label": "caption", "id": 2, "page_no": 10, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 134.765, "t": 123.58399999999995, "r": 480.588, "b": 178.70899999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.8657060861587524, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 133.72500000000002, "r_x1": 162.644, "r_y1": 133.72500000000002, "r_x2": 162.644, "r_y2": 125.79899999999998, "r_x3": 134.765, "r_y3": 125.79899999999998, "coord_origin": "TOPLEFT"}, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.215, "r_y0": 134.87300000000005, "r_x1": 480.587, "r_y1": 134.87300000000005, "r_x2": 480.587, "r_y2": 123.58399999999995, "r_x3": 165.215, "r_y3": 123.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 145.832, "r_x1": 480.588, "r_y1": 145.832, "r_x2": 480.588, "r_y2": 134.543, "r_x3": 134.765, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 156.79100000000005, "r_x1": 480.588, "r_y1": 156.79100000000005, "r_x2": 480.588, "r_y2": 145.50199999999995, "r_x3": 134.765, "r_y3": 145.50199999999995, "coord_origin": "TOPLEFT"}, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 167.75, "r_x1": 480.588, "r_y1": 167.75, "r_x2": 480.588, "r_y2": 156.461, "r_x3": 134.765, "r_y3": 156.461, "coord_origin": "TOPLEFT"}, "text": "didn't complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn't complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 178.70899999999995, "r_x1": 415.845, "r_y1": 178.70899999999995, "r_x2": 415.845, "r_y2": 167.41999999999996, "r_x3": 134.765, "r_y3": 167.41999999999996, "coord_origin": "TOPLEFT"}, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 6. Visualization of predicted structure and detected bounding boxes on a complex table with many rows. The OTSL model (B) captured repeating pattern of horizontally merged cells from the GT (A), unlike the HTML model (C). The HTML model also didn't complete the HTML sequence correctly and displayed a lot more of drift and overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet."}, {"label": "picture", "id": 3, "page_no": 10, "cluster": {"id": 3, "label": "picture", "bbox": {"l": 168.39285278320312, "t": 181.9665069580078, "r": 447.35137939453125, "b": 634.0056762695312, "coord_origin": "TOPLEFT"}, "confidence": 0.7612658739089966, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.505, "r_y0": 320.335, "r_x1": 177.596, "r_y1": 320.335, "r_x2": 177.596, "r_y2": 312.552, "r_x3": 171.505, "r_y3": 312.552, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.058, "r_y0": 500.537, "r_x1": 177.149, "r_y1": 500.537, "r_x2": 177.149, "r_y2": 492.754, "r_x3": 171.058, "r_y3": 492.754, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 633.395, "r_x1": 374.963, "r_y1": 633.395, "r_x2": 374.963, "r_y2": 627.558, "r_x3": 283.047, "r_y3": 627.558, "coord_origin": "TOPLEFT"}, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 623.271, "r_x1": 398.06, "r_y1": 623.271, "r_x2": 398.06, "r_y2": 617.434, "r_x3": 283.047, "r_y3": 617.434, "coord_origin": "TOPLEFT"}, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.642, "r_y0": 471.511, "r_x1": 437.508, "r_y1": 471.511, "r_x2": 437.508, "r_y2": 465.674, "r_x3": 293.642, "r_y3": 465.674, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 294.273, "r_x1": 239.235, "r_y1": 294.273, "r_x2": 239.235, "r_y2": 288.436, "r_x3": 181.891, "r_y3": 288.436, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 300.807, "r_x1": 251.529, "r_y1": 300.807, "r_x2": 251.529, "r_y2": 294.97, "r_x3": 181.891, "r_y3": 294.97, "coord_origin": "TOPLEFT"}, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.834, "r_y0": 194.32600000000002, "r_x1": 253.613, "r_y1": 194.32600000000002, "r_x2": 253.613, "r_y2": 186.962, "r_x3": 247.834, "r_y3": 186.962, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.19, "r_y0": 613.719, "r_x1": 381.547, "r_y1": 613.719, "r_x2": 381.547, "r_y2": 607.8820000000001, "r_x3": 292.19, "r_y3": 607.8820000000001, "coord_origin": "TOPLEFT"}, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 403.401, "r_x1": 180.173, "r_y1": 381.368, "r_x2": 172.39, "r_y2": 381.363, "r_x3": 172.374, "r_y3": 403.395, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 578.748, "r_x1": 180.174, "r_y1": 555.783, "r_x2": 172.391, "r_y2": 555.777, "r_x3": 172.374, "r_y3": 578.742, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 18, "label": "text", "bbox": {"l": 171.505, "t": 312.552, "r": 177.596, "b": 320.335, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.505, "r_y0": 320.335, "r_x1": 177.596, "r_y1": 320.335, "r_x2": 177.596, "r_y2": 312.552, "r_x3": 171.505, "r_y3": 312.552, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 171.058, "t": 492.754, "r": 177.149, "b": 500.537, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.058, "r_y0": 500.537, "r_x1": 177.149, "r_y1": 500.537, "r_x2": 177.149, "r_y2": 492.754, "r_x3": 171.058, "r_y3": 492.754, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 283.047, "t": 627.558, "r": 374.963, "b": 633.395, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 633.395, "r_x1": 374.963, "r_y1": 633.395, "r_x2": 374.963, "r_y2": 627.558, "r_x3": 283.047, "r_y3": 627.558, "coord_origin": "TOPLEFT"}, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 283.047, "t": 617.434, "r": 398.06, "b": 623.271, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 623.271, "r_x1": 398.06, "r_y1": 623.271, "r_x2": 398.06, "r_y2": 617.434, "r_x3": 283.047, "r_y3": 617.434, "coord_origin": "TOPLEFT"}, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 293.642, "t": 465.674, "r": 437.508, "b": 471.511, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.642, "r_y0": 471.511, "r_x1": 437.508, "r_y1": 471.511, "r_x2": 437.508, "r_y2": 465.674, "r_x3": 293.642, "r_y3": 465.674, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 181.891, "t": 288.436, "r": 239.235, "b": 294.273, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 294.273, "r_x1": 239.235, "r_y1": 294.273, "r_x2": 239.235, "r_y2": 288.436, "r_x3": 181.891, "r_y3": 288.436, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 181.891, "t": 294.97, "r": 251.529, "b": 300.807, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 300.807, "r_x1": 251.529, "r_y1": 300.807, "r_x2": 251.529, "r_y2": 294.97, "r_x3": 181.891, "r_y3": 294.97, "coord_origin": "TOPLEFT"}, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 247.834, "t": 186.962, "r": 253.613, "b": 194.32600000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.834, "r_y0": 194.32600000000002, "r_x1": 253.613, "r_y1": 194.32600000000002, "r_x2": 253.613, "r_y2": 186.962, "r_x3": 247.834, "r_y3": 186.962, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 292.19, "t": 607.8820000000001, "r": 381.547, "b": 613.719, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.19, "r_y0": 613.719, "r_x1": 381.547, "r_y1": 613.719, "r_x2": 381.547, "r_y2": 607.8820000000001, "r_x3": 292.19, "r_y3": 607.8820000000001, "coord_origin": "TOPLEFT"}, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 172.374, "t": 381.363, "r": 180.173, "b": 403.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 403.401, "r_x1": 180.173, "r_y1": 381.368, "r_x2": 172.39, "r_y2": 381.363, "r_x3": 172.374, "r_y3": 403.395, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 172.374, "t": 555.777, "r": 180.174, "b": 578.748, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 578.748, "r_x1": 180.174, "r_y1": 555.783, "r_x2": 172.391, "r_y2": 555.777, "r_x3": 172.374, "r_y3": 578.742, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "caption", "id": 2, "page_no": 10, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 134.765, "t": 123.58399999999995, "r": 480.588, "b": 178.70899999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.8657060861587524, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 133.72500000000002, "r_x1": 162.644, "r_y1": 133.72500000000002, "r_x2": 162.644, "r_y2": 125.79899999999998, "r_x3": 134.765, "r_y3": 125.79899999999998, "coord_origin": "TOPLEFT"}, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.215, "r_y0": 134.87300000000005, "r_x1": 480.587, "r_y1": 134.87300000000005, "r_x2": 480.587, "r_y2": 123.58399999999995, "r_x3": 165.215, "r_y3": 123.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 145.832, "r_x1": 480.588, "r_y1": 145.832, "r_x2": 480.588, "r_y2": 134.543, "r_x3": 134.765, "r_y3": 134.543, "coord_origin": "TOPLEFT"}, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 156.79100000000005, "r_x1": 480.588, "r_y1": 156.79100000000005, "r_x2": 480.588, "r_y2": 145.50199999999995, "r_x3": 134.765, "r_y3": 145.50199999999995, "coord_origin": "TOPLEFT"}, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 167.75, "r_x1": 480.588, "r_y1": 167.75, "r_x2": 480.588, "r_y2": 156.461, "r_x3": 134.765, "r_y3": 156.461, "coord_origin": "TOPLEFT"}, "text": "didn't complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn't complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 178.70899999999995, "r_x1": 415.845, "r_y1": 178.70899999999995, "r_x2": 415.845, "r_y2": 167.41999999999996, "r_x3": 134.765, "r_y3": 167.41999999999996, "coord_origin": "TOPLEFT"}, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Fig. 6. Visualization of predicted structure and detected bounding boxes on a complex table with many rows. The OTSL model (B) captured repeating pattern of horizontally merged cells from the GT (A), unlike the HTML model (C). The HTML model also didn't complete the HTML sequence correctly and displayed a lot more of drift and overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet."}, {"label": "picture", "id": 3, "page_no": 10, "cluster": {"id": 3, "label": "picture", "bbox": {"l": 168.39285278320312, "t": 181.9665069580078, "r": 447.35137939453125, "b": 634.0056762695312, "coord_origin": "TOPLEFT"}, "confidence": 0.7612658739089966, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.505, "r_y0": 320.335, "r_x1": 177.596, "r_y1": 320.335, "r_x2": 177.596, "r_y2": 312.552, "r_x3": 171.505, "r_y3": 312.552, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.058, "r_y0": 500.537, "r_x1": 177.149, "r_y1": 500.537, "r_x2": 177.149, "r_y2": 492.754, "r_x3": 171.058, "r_y3": 492.754, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 633.395, "r_x1": 374.963, "r_y1": 633.395, "r_x2": 374.963, "r_y2": 627.558, "r_x3": 283.047, "r_y3": 627.558, "coord_origin": "TOPLEFT"}, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 623.271, "r_x1": 398.06, "r_y1": 623.271, "r_x2": 398.06, "r_y2": 617.434, "r_x3": 283.047, "r_y3": 617.434, "coord_origin": "TOPLEFT"}, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.642, "r_y0": 471.511, "r_x1": 437.508, "r_y1": 471.511, "r_x2": 437.508, "r_y2": 465.674, "r_x3": 293.642, "r_y3": 465.674, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 294.273, "r_x1": 239.235, "r_y1": 294.273, "r_x2": 239.235, "r_y2": 288.436, "r_x3": 181.891, "r_y3": 288.436, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 300.807, "r_x1": 251.529, "r_y1": 300.807, "r_x2": 251.529, "r_y2": 294.97, "r_x3": 181.891, "r_y3": 294.97, "coord_origin": "TOPLEFT"}, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.834, "r_y0": 194.32600000000002, "r_x1": 253.613, "r_y1": 194.32600000000002, "r_x2": 253.613, "r_y2": 186.962, "r_x3": 247.834, "r_y3": 186.962, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.19, "r_y0": 613.719, "r_x1": 381.547, "r_y1": 613.719, "r_x2": 381.547, "r_y2": 607.8820000000001, "r_x3": 292.19, "r_y3": 607.8820000000001, "coord_origin": "TOPLEFT"}, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 403.401, "r_x1": 180.173, "r_y1": 381.368, "r_x2": 172.39, "r_y2": 381.363, "r_x3": 172.374, "r_y3": 403.395, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 578.748, "r_x1": 180.174, "r_y1": 555.783, "r_x2": 172.391, "r_y2": 555.777, "r_x3": 172.374, "r_y3": 578.742, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 18, "label": "text", "bbox": {"l": 171.505, "t": 312.552, "r": 177.596, "b": 320.335, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.505, "r_y0": 320.335, "r_x1": 177.596, "r_y1": 320.335, "r_x2": 177.596, "r_y2": 312.552, "r_x3": 171.505, "r_y3": 312.552, "coord_origin": "TOPLEFT"}, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 171.058, "t": 492.754, "r": 177.149, "b": 500.537, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.058, "r_y0": 500.537, "r_x1": 177.149, "r_y1": 500.537, "r_x2": 177.149, "r_y2": 492.754, "r_x3": 171.058, "r_y3": 492.754, "coord_origin": "TOPLEFT"}, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 283.047, "t": 627.558, "r": 374.963, "b": 633.395, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 633.395, "r_x1": 374.963, "r_y1": 633.395, "r_x2": 374.963, "r_y2": 627.558, "r_x3": 283.047, "r_y3": 627.558, "coord_origin": "TOPLEFT"}, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 283.047, "t": 617.434, "r": 398.06, "b": 623.271, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 283.047, "r_y0": 623.271, "r_x1": 398.06, "r_y1": 623.271, "r_x2": 398.06, "r_y2": 617.434, "r_x3": 283.047, "r_y3": 617.434, "coord_origin": "TOPLEFT"}, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 293.642, "t": 465.674, "r": 437.508, "b": 471.511, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.642, "r_y0": 471.511, "r_x1": 437.508, "r_y1": 471.511, "r_x2": 437.508, "r_y2": 465.674, "r_x3": 293.642, "r_y3": 465.674, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 181.891, "t": 288.436, "r": 239.235, "b": 294.273, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 294.273, "r_x1": 239.235, "r_y1": 294.273, "r_x2": 239.235, "r_y2": 288.436, "r_x3": 181.891, "r_y3": 288.436, "coord_origin": "TOPLEFT"}, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 181.891, "t": 294.97, "r": 251.529, "b": 300.807, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.891, "r_y0": 300.807, "r_x1": 251.529, "r_y1": 300.807, "r_x2": 251.529, "r_y2": 294.97, "r_x3": 181.891, "r_y3": 294.97, "coord_origin": "TOPLEFT"}, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 247.834, "t": 186.962, "r": 253.613, "b": 194.32600000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.834, "r_y0": 194.32600000000002, "r_x1": 253.613, "r_y1": 194.32600000000002, "r_x2": 253.613, "r_y2": 186.962, "r_x3": 247.834, "r_y3": 186.962, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 292.19, "t": 607.8820000000001, "r": 381.547, "b": 613.719, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.19, "r_y0": 613.719, "r_x1": 381.547, "r_y1": 613.719, "r_x2": 381.547, "r_y2": 607.8820000000001, "r_x3": 292.19, "r_y3": 607.8820000000001, "coord_origin": "TOPLEFT"}, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 172.374, "t": 381.363, "r": 180.173, "b": 403.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 403.401, "r_x1": 180.173, "r_y1": 381.368, "r_x2": 172.39, "r_y2": 381.363, "r_x3": 172.374, "r_y3": 403.395, "coord_origin": "TOPLEFT"}, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 172.374, "t": 555.777, "r": 180.174, "b": 578.748, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.157, "r_y0": 578.748, "r_x1": 180.174, "r_y1": 555.783, "r_x2": 172.391, "r_y2": 555.777, "r_x3": 172.374, "r_y3": 578.742, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_header", "id": 0, "page_no": 10, "cluster": {"id": 0, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9301655888557434, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 1, "page_no": 10, "cluster": {"id": 1, "label": "page_header", "bbox": {"l": 471.376, "t": 91.49300000000005, "r": 480.59, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9007201790809631, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.376, "r_y0": 102.78200000000004, "r_x1": 480.59, "r_y1": 102.78200000000004, "r_x2": 480.59, "r_y2": 91.49300000000005, "r_x3": 471.376, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "11"}]}}, {"page_no": 11, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.11699999999996, "r_x1": 141.489, "r_y1": 128.11699999999996, "r_x2": 141.489, "r_y2": 117.54899999999998, "r_x3": 134.765, "r_y3": 117.54899999999998, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 128.11699999999996, "r_x1": 219.255, "r_y1": 128.11699999999996, "r_x2": 219.255, "r_y2": 117.54899999999998, "r_x3": 154.938, "r_y3": 117.54899999999998, "coord_origin": "TOPLEFT"}, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 155.66099999999994, "r_x1": 480.595, "r_y1": 155.66099999999994, "r_x2": 480.595, "r_y2": 146.86400000000003, "r_x3": 134.765, "r_y3": 146.86400000000003, "coord_origin": "TOPLEFT"}, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 167.61599999999999, "r_x1": 152.499, "r_y1": 167.61599999999999, "r_x2": 152.499, "r_y2": 158.81899999999996, "r_x3": 134.765, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "ture", "orig": "ture", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.963, "r_y0": 167.61599999999999, "r_x1": 205.131, "r_y1": 167.61599999999999, "r_x2": 205.131, "r_y2": 158.81899999999996, "r_x3": 156.963, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "recognition", "orig": "recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.594, "r_y0": 167.61599999999999, "r_x1": 480.595, "r_y1": 167.61599999999999, "r_x2": 480.595, "r_y2": 158.81899999999996, "r_x3": 209.594, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "with Im2Seq models is ill-suited and has serious limitations.", "orig": "with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 179.57100000000003, "r_x1": 480.59, "r_y1": 179.57100000000003, "r_x2": 480.59, "r_y2": 170.774, "r_x3": 134.765, "r_y3": 170.774, "coord_origin": "TOPLEFT"}, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 191.52700000000004, "r_x1": 480.596, "r_y1": 191.52700000000004, "r_x2": 480.596, "r_y2": 182.73000000000002, "r_x3": 134.765, "r_y3": 182.73000000000002, "coord_origin": "TOPLEFT"}, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 203.48199999999997, "r_x1": 239.539, "r_y1": 203.48199999999997, "r_x2": 239.539, "r_y2": 194.68499999999995, "r_x3": 134.765, "r_y3": 194.68499999999995, "coord_origin": "TOPLEFT"}, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 216.24099999999999, "r_x1": 480.593, "r_y1": 216.24099999999999, "r_x2": 480.593, "r_y2": 207.44399999999996, "r_x3": 149.709, "r_y3": 207.44399999999996, "coord_origin": "TOPLEFT"}, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 228.19600000000003, "r_x1": 480.594, "r_y1": 228.19600000000003, "r_x2": 480.594, "r_y2": 219.399, "r_x3": 134.765, "r_y3": 219.399, "coord_origin": "TOPLEFT"}, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 240.15099999999995, "r_x1": 480.591, "r_y1": 240.15099999999995, "r_x2": 480.591, "r_y2": 231.35400000000004, "r_x3": 134.765, "r_y3": 231.35400000000004, "coord_origin": "TOPLEFT"}, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 252.106, "r_x1": 230.936, "r_y1": 252.106, "r_x2": 230.936, "r_y2": 243.30899999999997, "r_x3": 134.765, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "OTSL representation.", "orig": "OTSL representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.838, "r_y0": 252.106, "r_x1": 281.762, "r_y1": 252.106, "r_x2": 281.762, "r_y2": 243.30899999999997, "r_x3": 235.838, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "Additional", "orig": "Additional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.664, "r_y0": 252.106, "r_x1": 340.395, "r_y1": 252.106, "r_x2": 340.395, "r_y2": 243.30899999999997, "r_x3": 286.664, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "performance", "orig": "performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.287, "r_y0": 252.106, "r_x1": 378.82, "r_y1": 252.106, "r_x2": 378.82, "r_y2": 243.30899999999997, "r_x3": 345.287, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "benefits", "orig": "benefits", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.721, "r_y0": 252.106, "r_x1": 456.32, "r_y1": 252.106, "r_x2": 456.32, "r_y2": 243.30899999999997, "r_x3": 383.721, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "can be obtained", "orig": "can be obtained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.221, "r_y0": 252.106, "r_x1": 480.588, "r_y1": 252.106, "r_x2": 480.588, "r_y2": 243.30899999999997, "r_x3": 461.221, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 264.062, "r_x1": 480.595, "r_y1": 264.062, "r_x2": 480.595, "r_y2": 255.265, "r_x3": 134.765, "r_y3": 255.265, "coord_origin": "TOPLEFT"}, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 276.01700000000005, "r_x1": 480.588, "r_y1": 276.01700000000005, "r_x2": 480.588, "r_y2": 267.22, "r_x3": 134.765, "r_y3": 267.22, "coord_origin": "TOPLEFT"}, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 287.972, "r_x1": 480.593, "r_y1": 287.972, "r_x2": 480.593, "r_y2": 279.17499999999995, "r_x3": 134.765, "r_y3": 279.17499999999995, "coord_origin": "TOPLEFT"}, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 299.927, "r_x1": 480.589, "r_y1": 299.927, "r_x2": 480.589, "r_y2": 291.13, "r_x3": 134.765, "r_y3": 291.13, "coord_origin": "TOPLEFT"}, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 311.882, "r_x1": 480.594, "r_y1": 311.882, "r_x2": 480.594, "r_y2": 303.085, "r_x3": 134.765, "r_y3": 303.085, "coord_origin": "TOPLEFT"}, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 323.837, "r_x1": 240.923, "r_y1": 323.837, "r_x2": 240.923, "r_y2": 315.04, "r_x3": 134.765, "r_y3": 315.04, "coord_origin": "TOPLEFT"}, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 336.596, "r_x1": 480.59, "r_y1": 336.596, "r_x2": 480.59, "r_y2": 327.799, "r_x3": 149.709, "r_y3": 327.799, "coord_origin": "TOPLEFT"}, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 348.552, "r_x1": 480.595, "r_y1": 348.552, "r_x2": 480.595, "r_y2": 339.755, "r_x3": 134.765, "r_y3": 339.755, "coord_origin": "TOPLEFT"}, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 360.507, "r_x1": 480.587, "r_y1": 360.507, "r_x2": 480.587, "r_y2": 351.71, "r_x3": 134.765, "r_y3": 351.71, "coord_origin": "TOPLEFT"}, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 372.462, "r_x1": 480.595, "r_y1": 372.462, "r_x2": 480.595, "r_y2": 363.665, "r_x3": 134.765, "r_y3": 363.665, "coord_origin": "TOPLEFT"}, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 384.417, "r_x1": 480.59, "r_y1": 384.417, "r_x2": 480.59, "r_y2": 375.62, "r_x3": 134.765, "r_y3": 375.62, "coord_origin": "TOPLEFT"}, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 396.372, "r_x1": 480.587, "r_y1": 396.372, "r_x2": 480.587, "r_y2": 387.575, "r_x3": 134.765, "r_y3": 387.575, "coord_origin": "TOPLEFT"}, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 408.328, "r_x1": 480.586, "r_y1": 408.328, "r_x2": 480.586, "r_y2": 399.531, "r_x3": 134.765, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 420.283, "r_x1": 480.587, "r_y1": 420.283, "r_x2": 480.587, "r_y2": 411.486, "r_x3": 134.765, "r_y3": 411.486, "coord_origin": "TOPLEFT"}, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 432.238, "r_x1": 480.595, "r_y1": 432.238, "r_x2": 480.595, "r_y2": 423.441, "r_x3": 134.765, "r_y3": 423.441, "coord_origin": "TOPLEFT"}, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 444.193, "r_x1": 480.588, "r_y1": 444.193, "r_x2": 480.588, "r_y2": 435.396, "r_x3": 134.765, "r_y3": 435.396, "coord_origin": "TOPLEFT"}, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 456.148, "r_x1": 480.59, "r_y1": 456.148, "r_x2": 480.59, "r_y2": 447.351, "r_x3": 134.765, "r_y3": 447.351, "coord_origin": "TOPLEFT"}, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 468.103, "r_x1": 366.777, "r_y1": 468.103, "r_x2": 366.777, "r_y2": 459.306, "r_x3": 134.765, "r_y3": 459.306, "coord_origin": "TOPLEFT"}, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 504.389, "r_x1": 197.686, "r_y1": 504.389, "r_x2": 197.686, "r_y2": 493.821, "r_x3": 134.765, "r_y3": 493.821, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 531.8910000000001, "r_x1": 146.537, "r_y1": 531.8910000000001, "r_x2": 146.537, "r_y2": 520.602, "r_x3": 139.371, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 531.8910000000001, "r_x1": 189.958, "r_y1": 531.8910000000001, "r_x2": 189.958, "r_y2": 520.602, "r_x3": 151.522, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Auer, C.,", "orig": "Auer, C.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.342, "r_y0": 531.8910000000001, "r_x1": 216.222, "r_y1": 531.8910000000001, "r_x2": 216.222, "r_y2": 520.602, "r_x3": 194.342, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Dolfi,", "orig": "Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.607, "r_y0": 531.8910000000001, "r_x1": 277.21, "r_y1": 531.8910000000001, "r_x2": 277.21, "r_y2": 520.602, "r_x3": 220.607, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "M., Carvalho,", "orig": "M., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.594, "r_y0": 531.8910000000001, "r_x1": 293.621, "r_y1": 531.8910000000001, "r_x2": 293.621, "r_y2": 520.602, "r_x3": 281.594, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "A.,", "orig": "A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.996, "r_y0": 531.8910000000001, "r_x1": 379.518, "r_y1": 531.8910000000001, "r_x2": 379.518, "r_y2": 520.602, "r_x3": 297.996, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Ramis, C.B., Staar,", "orig": "Ramis, C.B., Staar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.894, "r_y0": 531.8910000000001, "r_x1": 413.839, "r_y1": 531.8910000000001, "r_x2": 413.839, "r_y2": 520.602, "r_x3": 383.894, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "P.W.J.:", "orig": "P.W.J.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.214, "r_y0": 531.8910000000001, "r_x1": 459.065, "r_y1": 531.8910000000001, "r_x2": 459.065, "r_y2": 520.602, "r_x3": 418.214, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Delivering", "orig": "Delivering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.441, "r_y0": 531.8910000000001, "r_x1": 480.592, "r_y1": 531.8910000000001, "r_x2": 480.592, "r_y2": 520.602, "r_x3": 463.441, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "doc-", "orig": "doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 542.85, "r_x1": 235.799, "r_y1": 542.85, "r_x2": 235.799, "r_y2": 531.5609999999999, "r_x3": 151.518, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "ument conversion as", "orig": "ument conversion as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.246, "r_y0": 542.85, "r_x1": 270.806, "r_y1": 542.85, "r_x2": 270.806, "r_y2": 531.5609999999999, "r_x3": 240.246, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "a cloud", "orig": "a cloud", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.262, "r_y0": 542.85, "r_x1": 302.214, "r_y1": 542.85, "r_x2": 302.214, "r_y2": 531.5609999999999, "r_x3": 275.262, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "service", "orig": "service", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.661, "r_y0": 542.85, "r_x1": 346.433, "r_y1": 542.85, "r_x2": 346.433, "r_y2": 531.5609999999999, "r_x3": 306.661, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "with high", "orig": "with high", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.889, "r_y0": 542.85, "r_x1": 480.587, "r_y1": 542.85, "r_x2": 480.587, "r_y2": 531.5609999999999, "r_x3": 350.889, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "throughput and responsiveness.", "orig": "throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 553.809, "r_x1": 176.341, "r_y1": 553.809, "r_x2": 176.341, "r_y2": 542.52, "r_x3": 151.518, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.464, "r_y0": 552.6610000000001, "r_x1": 250.68, "r_y1": 552.6610000000001, "r_x2": 250.68, "r_y2": 544.735, "r_x3": 179.464, "r_y3": 544.735, "coord_origin": "TOPLEFT"}, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.804, "r_y0": 553.809, "r_x1": 281.957, "r_y1": 553.809, "r_x2": 281.957, "r_y2": 542.52, "r_x3": 253.804, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.078, "r_y0": 552.913, "r_x1": 478.034, "r_y1": 552.913, "r_x2": 478.034, "r_y2": 545.444, "r_x3": 285.078, "r_y3": 545.444, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.032, "r_y0": 553.809, "r_x1": 480.591, "r_y1": 553.809, "r_x2": 480.591, "r_y2": 542.52, "r_x3": 478.032, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 563.8720000000001, "r_x1": 344.474, "r_y1": 563.8720000000001, "r_x2": 344.474, "r_y2": 556.403, "r_x3": 151.518, "r_y3": 556.403, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 576.53, "r_x1": 146.537, "r_y1": 576.53, "r_x2": 146.537, "r_y2": 565.241, "r_x3": 139.371, "r_y3": 565.241, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 576.53, "r_x1": 480.586, "r_y1": 576.53, "r_x2": 480.586, "r_y2": 565.241, "r_x3": 151.522, "r_y3": 565.241, "coord_origin": "TOPLEFT"}, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 587.489, "r_x1": 480.59, "r_y1": 587.489, "r_x2": 480.59, "r_y2": 576.2, "r_x3": 151.518, "r_y3": 576.2, "coord_origin": "TOPLEFT"}, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 598.448, "r_x1": 480.592, "r_y1": 598.448, "r_x2": 480.592, "r_y2": 587.159, "r_x3": 151.518, "r_y3": 587.159, "coord_origin": "TOPLEFT"}, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 609.407, "r_x1": 364.179, "r_y1": 609.407, "r_x2": 364.179, "r_y2": 598.1179999999999, "r_x3": 151.518, "r_y3": 598.1179999999999, "coord_origin": "TOPLEFT"}, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 621.17, "r_x1": 146.537, "r_y1": 621.17, "r_x2": 146.537, "r_y2": 609.881, "r_x3": 139.371, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 621.17, "r_x1": 168.412, "r_y1": 621.17, "r_x2": 168.412, "r_y2": 609.881, "r_x3": 151.522, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Chi,", "orig": "Chi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.68, "r_y0": 621.17, "r_x1": 183.428, "r_y1": 621.17, "r_x2": 183.428, "r_y2": 609.881, "r_x3": 172.68, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Z.,", "orig": "Z.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.696, "r_y0": 621.17, "r_x1": 480.587, "r_y1": 621.17, "r_x2": 480.587, "r_y2": 609.881, "r_x3": 187.696, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 632.129, "r_x1": 400.225, "r_y1": 632.129, "r_x2": 400.225, "r_y2": 620.84, "r_x3": 151.518, "r_y3": 620.84, "coord_origin": "TOPLEFT"}, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 643.892, "r_x1": 146.537, "r_y1": 643.892, "r_x2": 146.537, "r_y2": 632.6030000000001, "r_x3": 139.371, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 643.892, "r_x1": 191.523, "r_y1": 643.892, "r_x2": 191.523, "r_y2": 632.6030000000001, "r_x3": 151.522, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Deng, Y.,", "orig": "Deng, Y.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.087, "r_y0": 643.892, "r_x1": 240.312, "r_y1": 643.892, "r_x2": 240.312, "r_y2": 632.6030000000001, "r_x3": 196.087, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Rosenberg,", "orig": "Rosenberg,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.876, "r_y0": 643.892, "r_x1": 257.031, "r_y1": 643.892, "r_x2": 257.031, "r_y2": 632.6030000000001, "r_x3": 244.876, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "D.,", "orig": "D.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.586, "r_y0": 643.892, "r_x1": 351.96, "r_y1": 643.892, "r_x2": 351.96, "r_y2": 632.6030000000001, "r_x3": 261.586, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Mann, G.: Challenges", "orig": "Mann, G.: Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.524, "r_y0": 643.892, "r_x1": 364.201, "r_y1": 643.892, "r_x2": 364.201, "r_y2": 632.6030000000001, "r_x3": 356.524, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 368.756, "r_y0": 643.892, "r_x1": 411.757, "r_y1": 643.892, "r_x2": 411.757, "r_y2": 632.6030000000001, "r_x3": 368.756, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "end-to-end", "orig": "end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.321, "r_y0": 643.892, "r_x1": 441.425, "r_y1": 643.892, "r_x2": 441.425, "r_y2": 632.6030000000001, "r_x3": 416.321, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "neural", "orig": "neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.989, "r_y0": 643.892, "r_x1": 480.588, "r_y1": 643.892, "r_x2": 480.588, "r_y2": 632.6030000000001, "r_x3": 445.989, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "scientific", "orig": "scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 654.851, "r_x1": 171.483, "r_y1": 654.851, "r_x2": 171.483, "r_y2": 643.562, "r_x3": 151.518, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.509, "r_y0": 654.851, "r_x1": 222.623, "r_y1": 654.851, "r_x2": 222.623, "r_y2": 643.562, "r_x3": 175.509, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.649, "r_y0": 654.851, "r_x1": 237.652, "r_y1": 654.851, "r_x2": 237.652, "r_y2": 643.562, "r_x3": 226.649, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "In:", "orig": "In:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.678, "r_y0": 654.851, "r_x1": 480.588, "r_y1": 654.851, "r_x2": 480.588, "r_y2": 643.562, "r_x3": 241.678, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 665.809, "r_x1": 350.111, "r_y1": 665.809, "r_x2": 350.111, "r_y2": 654.52, "r_x3": 151.518, "r_y3": 654.52, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 10, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 143.979, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8610832691192627, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "page_header", "bbox": {"l": 167.821, "t": 91.49300000000005, "r": 231.72, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8927664756774902, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "section_header", "bbox": {"l": 134.765, "t": 117.54899999999998, "r": 219.255, "b": 128.11699999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.915635347366333, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.11699999999996, "r_x1": 141.489, "r_y1": 128.11699999999996, "r_x2": 141.489, "r_y2": 117.54899999999998, "r_x3": 134.765, "r_y3": 117.54899999999998, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 128.11699999999996, "r_x1": 219.255, "r_y1": 128.11699999999996, "r_x2": 219.255, "r_y2": 117.54899999999998, "r_x3": 154.938, "r_y3": 117.54899999999998, "coord_origin": "TOPLEFT"}, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 146.86400000000003, "r": 480.596, "b": 203.48199999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9806171655654907, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 155.66099999999994, "r_x1": 480.595, "r_y1": 155.66099999999994, "r_x2": 480.595, "r_y2": 146.86400000000003, "r_x3": 134.765, "r_y3": 146.86400000000003, "coord_origin": "TOPLEFT"}, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 167.61599999999999, "r_x1": 152.499, "r_y1": 167.61599999999999, "r_x2": 152.499, "r_y2": 158.81899999999996, "r_x3": 134.765, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "ture", "orig": "ture", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.963, "r_y0": 167.61599999999999, "r_x1": 205.131, "r_y1": 167.61599999999999, "r_x2": 205.131, "r_y2": 158.81899999999996, "r_x3": 156.963, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "recognition", "orig": "recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.594, "r_y0": 167.61599999999999, "r_x1": 480.595, "r_y1": 167.61599999999999, "r_x2": 480.595, "r_y2": 158.81899999999996, "r_x3": 209.594, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "with Im2Seq models is ill-suited and has serious limitations.", "orig": "with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 179.57100000000003, "r_x1": 480.59, "r_y1": 179.57100000000003, "r_x2": 480.59, "r_y2": 170.774, "r_x3": 134.765, "r_y3": 170.774, "coord_origin": "TOPLEFT"}, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 191.52700000000004, "r_x1": 480.596, "r_y1": 191.52700000000004, "r_x2": 480.596, "r_y2": 182.73000000000002, "r_x3": 134.765, "r_y3": 182.73000000000002, "coord_origin": "TOPLEFT"}, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 203.48199999999997, "r_x1": 239.539, "r_y1": 203.48199999999997, "r_x2": 239.539, "r_y2": 194.68499999999995, "r_x3": 134.765, "r_y3": 194.68499999999995, "coord_origin": "TOPLEFT"}, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 207.44399999999996, "r": 480.595, "b": 323.837, "coord_origin": "TOPLEFT"}, "confidence": 0.9873476028442383, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 216.24099999999999, "r_x1": 480.593, "r_y1": 216.24099999999999, "r_x2": 480.593, "r_y2": 207.44399999999996, "r_x3": 149.709, "r_y3": 207.44399999999996, "coord_origin": "TOPLEFT"}, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 228.19600000000003, "r_x1": 480.594, "r_y1": 228.19600000000003, "r_x2": 480.594, "r_y2": 219.399, "r_x3": 134.765, "r_y3": 219.399, "coord_origin": "TOPLEFT"}, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 240.15099999999995, "r_x1": 480.591, "r_y1": 240.15099999999995, "r_x2": 480.591, "r_y2": 231.35400000000004, "r_x3": 134.765, "r_y3": 231.35400000000004, "coord_origin": "TOPLEFT"}, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 252.106, "r_x1": 230.936, "r_y1": 252.106, "r_x2": 230.936, "r_y2": 243.30899999999997, "r_x3": 134.765, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "OTSL representation.", "orig": "OTSL representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.838, "r_y0": 252.106, "r_x1": 281.762, "r_y1": 252.106, "r_x2": 281.762, "r_y2": 243.30899999999997, "r_x3": 235.838, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "Additional", "orig": "Additional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.664, "r_y0": 252.106, "r_x1": 340.395, "r_y1": 252.106, "r_x2": 340.395, "r_y2": 243.30899999999997, "r_x3": 286.664, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "performance", "orig": "performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.287, "r_y0": 252.106, "r_x1": 378.82, "r_y1": 252.106, "r_x2": 378.82, "r_y2": 243.30899999999997, "r_x3": 345.287, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "benefits", "orig": "benefits", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.721, "r_y0": 252.106, "r_x1": 456.32, "r_y1": 252.106, "r_x2": 456.32, "r_y2": 243.30899999999997, "r_x3": 383.721, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "can be obtained", "orig": "can be obtained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.221, "r_y0": 252.106, "r_x1": 480.588, "r_y1": 252.106, "r_x2": 480.588, "r_y2": 243.30899999999997, "r_x3": 461.221, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 264.062, "r_x1": 480.595, "r_y1": 264.062, "r_x2": 480.595, "r_y2": 255.265, "r_x3": 134.765, "r_y3": 255.265, "coord_origin": "TOPLEFT"}, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 276.01700000000005, "r_x1": 480.588, "r_y1": 276.01700000000005, "r_x2": 480.588, "r_y2": 267.22, "r_x3": 134.765, "r_y3": 267.22, "coord_origin": "TOPLEFT"}, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 287.972, "r_x1": 480.593, "r_y1": 287.972, "r_x2": 480.593, "r_y2": 279.17499999999995, "r_x3": 134.765, "r_y3": 279.17499999999995, "coord_origin": "TOPLEFT"}, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 299.927, "r_x1": 480.589, "r_y1": 299.927, "r_x2": 480.589, "r_y2": 291.13, "r_x3": 134.765, "r_y3": 291.13, "coord_origin": "TOPLEFT"}, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 311.882, "r_x1": 480.594, "r_y1": 311.882, "r_x2": 480.594, "r_y2": 303.085, "r_x3": 134.765, "r_y3": 303.085, "coord_origin": "TOPLEFT"}, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 323.837, "r_x1": 240.923, "r_y1": 323.837, "r_x2": 240.923, "r_y2": 315.04, "r_x3": 134.765, "r_y3": 315.04, "coord_origin": "TOPLEFT"}, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 327.799, "r": 480.595, "b": 468.103, "coord_origin": "TOPLEFT"}, "confidence": 0.9868747591972351, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 336.596, "r_x1": 480.59, "r_y1": 336.596, "r_x2": 480.59, "r_y2": 327.799, "r_x3": 149.709, "r_y3": 327.799, "coord_origin": "TOPLEFT"}, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 348.552, "r_x1": 480.595, "r_y1": 348.552, "r_x2": 480.595, "r_y2": 339.755, "r_x3": 134.765, "r_y3": 339.755, "coord_origin": "TOPLEFT"}, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 360.507, "r_x1": 480.587, "r_y1": 360.507, "r_x2": 480.587, "r_y2": 351.71, "r_x3": 134.765, "r_y3": 351.71, "coord_origin": "TOPLEFT"}, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 372.462, "r_x1": 480.595, "r_y1": 372.462, "r_x2": 480.595, "r_y2": 363.665, "r_x3": 134.765, "r_y3": 363.665, "coord_origin": "TOPLEFT"}, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 384.417, "r_x1": 480.59, "r_y1": 384.417, "r_x2": 480.59, "r_y2": 375.62, "r_x3": 134.765, "r_y3": 375.62, "coord_origin": "TOPLEFT"}, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 396.372, "r_x1": 480.587, "r_y1": 396.372, "r_x2": 480.587, "r_y2": 387.575, "r_x3": 134.765, "r_y3": 387.575, "coord_origin": "TOPLEFT"}, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 408.328, "r_x1": 480.586, "r_y1": 408.328, "r_x2": 480.586, "r_y2": 399.531, "r_x3": 134.765, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 420.283, "r_x1": 480.587, "r_y1": 420.283, "r_x2": 480.587, "r_y2": 411.486, "r_x3": 134.765, "r_y3": 411.486, "coord_origin": "TOPLEFT"}, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 432.238, "r_x1": 480.595, "r_y1": 432.238, "r_x2": 480.595, "r_y2": 423.441, "r_x3": 134.765, "r_y3": 423.441, "coord_origin": "TOPLEFT"}, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 444.193, "r_x1": 480.588, "r_y1": 444.193, "r_x2": 480.588, "r_y2": 435.396, "r_x3": 134.765, "r_y3": 435.396, "coord_origin": "TOPLEFT"}, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 456.148, "r_x1": 480.59, "r_y1": 456.148, "r_x2": 480.59, "r_y2": 447.351, "r_x3": 134.765, "r_y3": 447.351, "coord_origin": "TOPLEFT"}, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 468.103, "r_x1": 366.777, "r_y1": 468.103, "r_x2": 366.777, "r_y2": 459.306, "r_x3": 134.765, "r_y3": 459.306, "coord_origin": "TOPLEFT"}, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "section_header", "bbox": {"l": 134.765, "t": 493.821, "r": 197.686, "b": 504.389, "coord_origin": "TOPLEFT"}, "confidence": 0.9403266310691833, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 504.389, "r_x1": 197.686, "r_y1": 504.389, "r_x2": 197.686, "r_y2": 493.821, "r_x3": 134.765, "r_y3": 493.821, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 139.371, "t": 520.602, "r": 480.592, "b": 563.8720000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9698606729507446, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 531.8910000000001, "r_x1": 146.537, "r_y1": 531.8910000000001, "r_x2": 146.537, "r_y2": 520.602, "r_x3": 139.371, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 531.8910000000001, "r_x1": 189.958, "r_y1": 531.8910000000001, "r_x2": 189.958, "r_y2": 520.602, "r_x3": 151.522, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Auer, C.,", "orig": "Auer, C.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.342, "r_y0": 531.8910000000001, "r_x1": 216.222, "r_y1": 531.8910000000001, "r_x2": 216.222, "r_y2": 520.602, "r_x3": 194.342, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Dolfi,", "orig": "Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.607, "r_y0": 531.8910000000001, "r_x1": 277.21, "r_y1": 531.8910000000001, "r_x2": 277.21, "r_y2": 520.602, "r_x3": 220.607, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "M., Carvalho,", "orig": "M., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.594, "r_y0": 531.8910000000001, "r_x1": 293.621, "r_y1": 531.8910000000001, "r_x2": 293.621, "r_y2": 520.602, "r_x3": 281.594, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "A.,", "orig": "A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.996, "r_y0": 531.8910000000001, "r_x1": 379.518, "r_y1": 531.8910000000001, "r_x2": 379.518, "r_y2": 520.602, "r_x3": 297.996, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Ramis, C.B., Staar,", "orig": "Ramis, C.B., Staar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.894, "r_y0": 531.8910000000001, "r_x1": 413.839, "r_y1": 531.8910000000001, "r_x2": 413.839, "r_y2": 520.602, "r_x3": 383.894, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "P.W.J.:", "orig": "P.W.J.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.214, "r_y0": 531.8910000000001, "r_x1": 459.065, "r_y1": 531.8910000000001, "r_x2": 459.065, "r_y2": 520.602, "r_x3": 418.214, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Delivering", "orig": "Delivering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.441, "r_y0": 531.8910000000001, "r_x1": 480.592, "r_y1": 531.8910000000001, "r_x2": 480.592, "r_y2": 520.602, "r_x3": 463.441, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "doc-", "orig": "doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 542.85, "r_x1": 235.799, "r_y1": 542.85, "r_x2": 235.799, "r_y2": 531.5609999999999, "r_x3": 151.518, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "ument conversion as", "orig": "ument conversion as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.246, "r_y0": 542.85, "r_x1": 270.806, "r_y1": 542.85, "r_x2": 270.806, "r_y2": 531.5609999999999, "r_x3": 240.246, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "a cloud", "orig": "a cloud", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.262, "r_y0": 542.85, "r_x1": 302.214, "r_y1": 542.85, "r_x2": 302.214, "r_y2": 531.5609999999999, "r_x3": 275.262, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "service", "orig": "service", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.661, "r_y0": 542.85, "r_x1": 346.433, "r_y1": 542.85, "r_x2": 346.433, "r_y2": 531.5609999999999, "r_x3": 306.661, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "with high", "orig": "with high", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.889, "r_y0": 542.85, "r_x1": 480.587, "r_y1": 542.85, "r_x2": 480.587, "r_y2": 531.5609999999999, "r_x3": 350.889, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "throughput and responsiveness.", "orig": "throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 553.809, "r_x1": 176.341, "r_y1": 553.809, "r_x2": 176.341, "r_y2": 542.52, "r_x3": 151.518, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.464, "r_y0": 552.6610000000001, "r_x1": 250.68, "r_y1": 552.6610000000001, "r_x2": 250.68, "r_y2": 544.735, "r_x3": 179.464, "r_y3": 544.735, "coord_origin": "TOPLEFT"}, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.804, "r_y0": 553.809, "r_x1": 281.957, "r_y1": 553.809, "r_x2": 281.957, "r_y2": 542.52, "r_x3": 253.804, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.078, "r_y0": 552.913, "r_x1": 478.034, "r_y1": 552.913, "r_x2": 478.034, "r_y2": 545.444, "r_x3": 285.078, "r_y3": 545.444, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.032, "r_y0": 553.809, "r_x1": 480.591, "r_y1": 553.809, "r_x2": 480.591, "r_y2": 542.52, "r_x3": 478.032, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 563.8720000000001, "r_x1": 344.474, "r_y1": 563.8720000000001, "r_x2": 344.474, "r_y2": 556.403, "r_x3": 151.518, "r_y3": 556.403, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 139.371, "t": 565.241, "r": 480.592, "b": 609.407, "coord_origin": "TOPLEFT"}, "confidence": 0.9730570316314697, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 576.53, "r_x1": 146.537, "r_y1": 576.53, "r_x2": 146.537, "r_y2": 565.241, "r_x3": 139.371, "r_y3": 565.241, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 576.53, "r_x1": 480.586, "r_y1": 576.53, "r_x2": 480.586, "r_y2": 565.241, "r_x3": 151.522, "r_y3": 565.241, "coord_origin": "TOPLEFT"}, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 587.489, "r_x1": 480.59, "r_y1": 587.489, "r_x2": 480.59, "r_y2": 576.2, "r_x3": 151.518, "r_y3": 576.2, "coord_origin": "TOPLEFT"}, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 598.448, "r_x1": 480.592, "r_y1": 598.448, "r_x2": 480.592, "r_y2": 587.159, "r_x3": 151.518, "r_y3": 587.159, "coord_origin": "TOPLEFT"}, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 609.407, "r_x1": 364.179, "r_y1": 609.407, "r_x2": 364.179, "r_y2": 598.1179999999999, "r_x3": 151.518, "r_y3": 598.1179999999999, "coord_origin": "TOPLEFT"}, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 139.371, "t": 609.881, "r": 480.587, "b": 632.129, "coord_origin": "TOPLEFT"}, "confidence": 0.9617196321487427, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 621.17, "r_x1": 146.537, "r_y1": 621.17, "r_x2": 146.537, "r_y2": 609.881, "r_x3": 139.371, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 621.17, "r_x1": 168.412, "r_y1": 621.17, "r_x2": 168.412, "r_y2": 609.881, "r_x3": 151.522, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Chi,", "orig": "Chi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.68, "r_y0": 621.17, "r_x1": 183.428, "r_y1": 621.17, "r_x2": 183.428, "r_y2": 609.881, "r_x3": 172.68, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Z.,", "orig": "Z.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.696, "r_y0": 621.17, "r_x1": 480.587, "r_y1": 621.17, "r_x2": 480.587, "r_y2": 609.881, "r_x3": 187.696, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 632.129, "r_x1": 400.225, "r_y1": 632.129, "r_x2": 400.225, "r_y2": 620.84, "r_x3": 151.518, "r_y3": 620.84, "coord_origin": "TOPLEFT"}, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 139.371, "t": 632.6030000000001, "r": 480.588, "b": 665.809, "coord_origin": "TOPLEFT"}, "confidence": 0.9754673838615417, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 643.892, "r_x1": 146.537, "r_y1": 643.892, "r_x2": 146.537, "r_y2": 632.6030000000001, "r_x3": 139.371, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 643.892, "r_x1": 191.523, "r_y1": 643.892, "r_x2": 191.523, "r_y2": 632.6030000000001, "r_x3": 151.522, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Deng, Y.,", "orig": "Deng, Y.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.087, "r_y0": 643.892, "r_x1": 240.312, "r_y1": 643.892, "r_x2": 240.312, "r_y2": 632.6030000000001, "r_x3": 196.087, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Rosenberg,", "orig": "Rosenberg,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.876, "r_y0": 643.892, "r_x1": 257.031, "r_y1": 643.892, "r_x2": 257.031, "r_y2": 632.6030000000001, "r_x3": 244.876, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "D.,", "orig": "D.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.586, "r_y0": 643.892, "r_x1": 351.96, "r_y1": 643.892, "r_x2": 351.96, "r_y2": 632.6030000000001, "r_x3": 261.586, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Mann, G.: Challenges", "orig": "Mann, G.: Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.524, "r_y0": 643.892, "r_x1": 364.201, "r_y1": 643.892, "r_x2": 364.201, "r_y2": 632.6030000000001, "r_x3": 356.524, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 368.756, "r_y0": 643.892, "r_x1": 411.757, "r_y1": 643.892, "r_x2": 411.757, "r_y2": 632.6030000000001, "r_x3": 368.756, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "end-to-end", "orig": "end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.321, "r_y0": 643.892, "r_x1": 441.425, "r_y1": 643.892, "r_x2": 441.425, "r_y2": 632.6030000000001, "r_x3": 416.321, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "neural", "orig": "neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.989, "r_y0": 643.892, "r_x1": 480.588, "r_y1": 643.892, "r_x2": 480.588, "r_y2": 632.6030000000001, "r_x3": 445.989, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "scientific", "orig": "scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 654.851, "r_x1": 171.483, "r_y1": 654.851, "r_x2": 171.483, "r_y2": 643.562, "r_x3": 151.518, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.509, "r_y0": 654.851, "r_x1": 222.623, "r_y1": 654.851, "r_x2": 222.623, "r_y2": 643.562, "r_x3": 175.509, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.649, "r_y0": 654.851, "r_x1": 237.652, "r_y1": 654.851, "r_x2": 237.652, "r_y2": 643.562, "r_x3": 226.649, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "In:", "orig": "In:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.678, "r_y0": 654.851, "r_x1": 480.588, "r_y1": 654.851, "r_x2": 480.588, "r_y2": 643.562, "r_x3": 241.678, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 665.809, "r_x1": 350.111, "r_y1": 665.809, "r_x2": 350.111, "r_y2": 654.52, "r_x3": 151.518, "r_y3": 654.52, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 10, "page_no": 11, "cluster": {"id": 10, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 143.979, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8610832691192627, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "12"}, {"label": "page_header", "id": 9, "page_no": 11, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 167.821, "t": 91.49300000000005, "r": 231.72, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8927664756774902, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}, {"label": "section_header", "id": 8, "page_no": 11, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 134.765, "t": 117.54899999999998, "r": 219.255, "b": 128.11699999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.915635347366333, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.11699999999996, "r_x1": 141.489, "r_y1": 128.11699999999996, "r_x2": 141.489, "r_y2": 117.54899999999998, "r_x3": 134.765, "r_y3": 117.54899999999998, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 128.11699999999996, "r_x1": 219.255, "r_y1": 128.11699999999996, "r_x2": 219.255, "r_y2": 117.54899999999998, "r_x3": 154.938, "r_y3": 117.54899999999998, "coord_origin": "TOPLEFT"}, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6 Conclusion"}, {"label": "text", "id": 2, "page_no": 11, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 146.86400000000003, "r": 480.596, "b": 203.48199999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9806171655654907, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 155.66099999999994, "r_x1": 480.595, "r_y1": 155.66099999999994, "r_x2": 480.595, "r_y2": 146.86400000000003, "r_x3": 134.765, "r_y3": 146.86400000000003, "coord_origin": "TOPLEFT"}, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 167.61599999999999, "r_x1": 152.499, "r_y1": 167.61599999999999, "r_x2": 152.499, "r_y2": 158.81899999999996, "r_x3": 134.765, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "ture", "orig": "ture", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.963, "r_y0": 167.61599999999999, "r_x1": 205.131, "r_y1": 167.61599999999999, "r_x2": 205.131, "r_y2": 158.81899999999996, "r_x3": 156.963, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "recognition", "orig": "recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.594, "r_y0": 167.61599999999999, "r_x1": 480.595, "r_y1": 167.61599999999999, "r_x2": 480.595, "r_y2": 158.81899999999996, "r_x3": 209.594, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "with Im2Seq models is ill-suited and has serious limitations.", "orig": "with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 179.57100000000003, "r_x1": 480.59, "r_y1": 179.57100000000003, "r_x2": 480.59, "r_y2": 170.774, "r_x3": 134.765, "r_y3": 170.774, "coord_origin": "TOPLEFT"}, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 191.52700000000004, "r_x1": 480.596, "r_y1": 191.52700000000004, "r_x2": 480.596, "r_y2": 182.73000000000002, "r_x3": 134.765, "r_y3": 182.73000000000002, "coord_origin": "TOPLEFT"}, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 203.48199999999997, "r_x1": 239.539, "r_y1": 203.48199999999997, "r_x2": 239.539, "r_y2": 194.68499999999995, "r_x3": 134.765, "r_y3": 194.68499999999995, "coord_origin": "TOPLEFT"}, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We demonstrated that representing tables in HTML for the task of table structure recognition with Im2Seq models is ill-suited and has serious limitations. Furthermore, we presented in this paper an Optimized Table Structure Language (OTSL) which, when compared to commonly used general purpose languages, has several key benefits."}, {"label": "text", "id": 0, "page_no": 11, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 207.44399999999996, "r": 480.595, "b": 323.837, "coord_origin": "TOPLEFT"}, "confidence": 0.9873476028442383, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 216.24099999999999, "r_x1": 480.593, "r_y1": 216.24099999999999, "r_x2": 480.593, "r_y2": 207.44399999999996, "r_x3": 149.709, "r_y3": 207.44399999999996, "coord_origin": "TOPLEFT"}, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 228.19600000000003, "r_x1": 480.594, "r_y1": 228.19600000000003, "r_x2": 480.594, "r_y2": 219.399, "r_x3": 134.765, "r_y3": 219.399, "coord_origin": "TOPLEFT"}, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 240.15099999999995, "r_x1": 480.591, "r_y1": 240.15099999999995, "r_x2": 480.591, "r_y2": 231.35400000000004, "r_x3": 134.765, "r_y3": 231.35400000000004, "coord_origin": "TOPLEFT"}, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 252.106, "r_x1": 230.936, "r_y1": 252.106, "r_x2": 230.936, "r_y2": 243.30899999999997, "r_x3": 134.765, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "OTSL representation.", "orig": "OTSL representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.838, "r_y0": 252.106, "r_x1": 281.762, "r_y1": 252.106, "r_x2": 281.762, "r_y2": 243.30899999999997, "r_x3": 235.838, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "Additional", "orig": "Additional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.664, "r_y0": 252.106, "r_x1": 340.395, "r_y1": 252.106, "r_x2": 340.395, "r_y2": 243.30899999999997, "r_x3": 286.664, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "performance", "orig": "performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.287, "r_y0": 252.106, "r_x1": 378.82, "r_y1": 252.106, "r_x2": 378.82, "r_y2": 243.30899999999997, "r_x3": 345.287, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "benefits", "orig": "benefits", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.721, "r_y0": 252.106, "r_x1": 456.32, "r_y1": 252.106, "r_x2": 456.32, "r_y2": 243.30899999999997, "r_x3": 383.721, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "can be obtained", "orig": "can be obtained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.221, "r_y0": 252.106, "r_x1": 480.588, "r_y1": 252.106, "r_x2": 480.588, "r_y2": 243.30899999999997, "r_x3": 461.221, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 264.062, "r_x1": 480.595, "r_y1": 264.062, "r_x2": 480.595, "r_y2": 255.265, "r_x3": 134.765, "r_y3": 255.265, "coord_origin": "TOPLEFT"}, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 276.01700000000005, "r_x1": 480.588, "r_y1": 276.01700000000005, "r_x2": 480.588, "r_y2": 267.22, "r_x3": 134.765, "r_y3": 267.22, "coord_origin": "TOPLEFT"}, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 287.972, "r_x1": 480.593, "r_y1": 287.972, "r_x2": 480.593, "r_y2": 279.17499999999995, "r_x3": 134.765, "r_y3": 279.17499999999995, "coord_origin": "TOPLEFT"}, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 299.927, "r_x1": 480.589, "r_y1": 299.927, "r_x2": 480.589, "r_y2": 291.13, "r_x3": 134.765, "r_y3": 291.13, "coord_origin": "TOPLEFT"}, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 311.882, "r_x1": 480.594, "r_y1": 311.882, "r_x2": 480.594, "r_y2": 303.085, "r_x3": 134.765, "r_y3": 303.085, "coord_origin": "TOPLEFT"}, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 323.837, "r_x1": 240.923, "r_y1": 323.837, "r_x2": 240.923, "r_y2": 315.04, "r_x3": 134.765, "r_y3": 315.04, "coord_origin": "TOPLEFT"}, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "First and foremost, given the same network configuration, inference time for a table-structure prediction is about 2 times faster compared to the conventional HTML approach. This is primarily owed to the shorter sequence length of the OTSL representation. Additional performance benefits can be obtained with HPO (hyper parameter optimization). As we demonstrate in our experiments, models trained on OTSL can be significantly smaller, e.g. by reducing the number of encoder and decoder layers, while preserving comparatively good prediction quality. This can further improve inference performance, yielding 5-6 times faster inference speed in OTSL with prediction quality comparable to models trained on HTML (see Table 1)."}, {"label": "text", "id": 1, "page_no": 11, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 327.799, "r": 480.595, "b": 468.103, "coord_origin": "TOPLEFT"}, "confidence": 0.9868747591972351, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 336.596, "r_x1": 480.59, "r_y1": 336.596, "r_x2": 480.59, "r_y2": 327.799, "r_x3": 149.709, "r_y3": 327.799, "coord_origin": "TOPLEFT"}, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 348.552, "r_x1": 480.595, "r_y1": 348.552, "r_x2": 480.595, "r_y2": 339.755, "r_x3": 134.765, "r_y3": 339.755, "coord_origin": "TOPLEFT"}, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 360.507, "r_x1": 480.587, "r_y1": 360.507, "r_x2": 480.587, "r_y2": 351.71, "r_x3": 134.765, "r_y3": 351.71, "coord_origin": "TOPLEFT"}, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 372.462, "r_x1": 480.595, "r_y1": 372.462, "r_x2": 480.595, "r_y2": 363.665, "r_x3": 134.765, "r_y3": 363.665, "coord_origin": "TOPLEFT"}, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 384.417, "r_x1": 480.59, "r_y1": 384.417, "r_x2": 480.59, "r_y2": 375.62, "r_x3": 134.765, "r_y3": 375.62, "coord_origin": "TOPLEFT"}, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 396.372, "r_x1": 480.587, "r_y1": 396.372, "r_x2": 480.587, "r_y2": 387.575, "r_x3": 134.765, "r_y3": 387.575, "coord_origin": "TOPLEFT"}, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 408.328, "r_x1": 480.586, "r_y1": 408.328, "r_x2": 480.586, "r_y2": 399.531, "r_x3": 134.765, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 420.283, "r_x1": 480.587, "r_y1": 420.283, "r_x2": 480.587, "r_y2": 411.486, "r_x3": 134.765, "r_y3": 411.486, "coord_origin": "TOPLEFT"}, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 432.238, "r_x1": 480.595, "r_y1": 432.238, "r_x2": 480.595, "r_y2": 423.441, "r_x3": 134.765, "r_y3": 423.441, "coord_origin": "TOPLEFT"}, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 444.193, "r_x1": 480.588, "r_y1": 444.193, "r_x2": 480.588, "r_y2": 435.396, "r_x3": 134.765, "r_y3": 435.396, "coord_origin": "TOPLEFT"}, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 456.148, "r_x1": 480.59, "r_y1": 456.148, "r_x2": 480.59, "r_y2": 447.351, "r_x3": 134.765, "r_y3": 447.351, "coord_origin": "TOPLEFT"}, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 468.103, "r_x1": 366.777, "r_y1": 468.103, "r_x2": 366.777, "r_y2": 459.306, "r_x3": 134.765, "r_y3": 459.306, "coord_origin": "TOPLEFT"}, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vocabulary size. This allows autoregressive models to perform better in the TED metric, but especially with regards to prediction accuracy of the table-cell bounding boxes (see Table 2). As shown in Figure 5, we observe that the OTSL drastically reduces the drift for table cell bounding boxes at high row count and in sparse tables. This leads to more accurate predictions and a significant reduction in post-processing complexity, which is an undesired necessity in HTML-based Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few, simple and always backwards looking. Each new token can be validated only by analyzing the sequence of previous tokens, without requiring the entire sequence to detect mistakes. This in return allows to perform structural error detection and correction on-the-fly during sequence generation."}, {"label": "section_header", "id": 7, "page_no": 11, "cluster": {"id": 7, "label": "section_header", "bbox": {"l": 134.765, "t": 493.821, "r": 197.686, "b": 504.389, "coord_origin": "TOPLEFT"}, "confidence": 0.9403266310691833, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 504.389, "r_x1": 197.686, "r_y1": 504.389, "r_x2": 197.686, "r_y2": 493.821, "r_x3": 134.765, "r_y3": 493.821, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "References"}, {"label": "list_item", "id": 5, "page_no": 11, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 139.371, "t": 520.602, "r": 480.592, "b": 563.8720000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9698606729507446, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 531.8910000000001, "r_x1": 146.537, "r_y1": 531.8910000000001, "r_x2": 146.537, "r_y2": 520.602, "r_x3": 139.371, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 531.8910000000001, "r_x1": 189.958, "r_y1": 531.8910000000001, "r_x2": 189.958, "r_y2": 520.602, "r_x3": 151.522, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Auer, C.,", "orig": "Auer, C.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.342, "r_y0": 531.8910000000001, "r_x1": 216.222, "r_y1": 531.8910000000001, "r_x2": 216.222, "r_y2": 520.602, "r_x3": 194.342, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Dolfi,", "orig": "Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.607, "r_y0": 531.8910000000001, "r_x1": 277.21, "r_y1": 531.8910000000001, "r_x2": 277.21, "r_y2": 520.602, "r_x3": 220.607, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "M., Carvalho,", "orig": "M., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.594, "r_y0": 531.8910000000001, "r_x1": 293.621, "r_y1": 531.8910000000001, "r_x2": 293.621, "r_y2": 520.602, "r_x3": 281.594, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "A.,", "orig": "A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.996, "r_y0": 531.8910000000001, "r_x1": 379.518, "r_y1": 531.8910000000001, "r_x2": 379.518, "r_y2": 520.602, "r_x3": 297.996, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Ramis, C.B., Staar,", "orig": "Ramis, C.B., Staar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.894, "r_y0": 531.8910000000001, "r_x1": 413.839, "r_y1": 531.8910000000001, "r_x2": 413.839, "r_y2": 520.602, "r_x3": 383.894, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "P.W.J.:", "orig": "P.W.J.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.214, "r_y0": 531.8910000000001, "r_x1": 459.065, "r_y1": 531.8910000000001, "r_x2": 459.065, "r_y2": 520.602, "r_x3": 418.214, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Delivering", "orig": "Delivering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.441, "r_y0": 531.8910000000001, "r_x1": 480.592, "r_y1": 531.8910000000001, "r_x2": 480.592, "r_y2": 520.602, "r_x3": 463.441, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "doc-", "orig": "doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 542.85, "r_x1": 235.799, "r_y1": 542.85, "r_x2": 235.799, "r_y2": 531.5609999999999, "r_x3": 151.518, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "ument conversion as", "orig": "ument conversion as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.246, "r_y0": 542.85, "r_x1": 270.806, "r_y1": 542.85, "r_x2": 270.806, "r_y2": 531.5609999999999, "r_x3": 240.246, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "a cloud", "orig": "a cloud", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.262, "r_y0": 542.85, "r_x1": 302.214, "r_y1": 542.85, "r_x2": 302.214, "r_y2": 531.5609999999999, "r_x3": 275.262, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "service", "orig": "service", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.661, "r_y0": 542.85, "r_x1": 346.433, "r_y1": 542.85, "r_x2": 346.433, "r_y2": 531.5609999999999, "r_x3": 306.661, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "with high", "orig": "with high", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.889, "r_y0": 542.85, "r_x1": 480.587, "r_y1": 542.85, "r_x2": 480.587, "r_y2": 531.5609999999999, "r_x3": 350.889, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "throughput and responsiveness.", "orig": "throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 553.809, "r_x1": 176.341, "r_y1": 553.809, "r_x2": 176.341, "r_y2": 542.52, "r_x3": 151.518, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.464, "r_y0": 552.6610000000001, "r_x1": 250.68, "r_y1": 552.6610000000001, "r_x2": 250.68, "r_y2": 544.735, "r_x3": 179.464, "r_y3": 544.735, "coord_origin": "TOPLEFT"}, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.804, "r_y0": 553.809, "r_x1": 281.957, "r_y1": 553.809, "r_x2": 281.957, "r_y2": 542.52, "r_x3": 253.804, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.078, "r_y0": 552.913, "r_x1": 478.034, "r_y1": 552.913, "r_x2": 478.034, "r_y2": 545.444, "r_x3": 285.078, "r_y3": 545.444, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.032, "r_y0": 553.809, "r_x1": 480.591, "r_y1": 553.809, "r_x2": 480.591, "r_y2": 542.52, "r_x3": 478.032, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 563.8720000000001, "r_x1": 344.474, "r_y1": 563.8720000000001, "r_x2": 344.474, "r_y2": 556.403, "r_x3": 151.518, "r_y3": 556.403, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering document conversion as a cloud service with high throughput and responsiveness. CoRR abs/2206.00785 (2022). https://doi.org/10.48550/arXiv.2206.00785 , https://doi.org/10.48550/arXiv.2206.00785"}, {"label": "list_item", "id": 4, "page_no": 11, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 139.371, "t": 565.241, "r": 480.592, "b": 609.407, "coord_origin": "TOPLEFT"}, "confidence": 0.9730570316314697, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 576.53, "r_x1": 146.537, "r_y1": 576.53, "r_x2": 146.537, "r_y2": 565.241, "r_x3": 139.371, "r_y3": 565.241, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 576.53, "r_x1": 480.586, "r_y1": 576.53, "r_x2": 480.586, "r_y2": 565.241, "r_x3": 151.522, "r_y3": 565.241, "coord_origin": "TOPLEFT"}, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 587.489, "r_x1": 480.59, "r_y1": 587.489, "r_x2": 480.59, "r_y2": 576.2, "r_x3": 151.518, "r_y3": 576.2, "coord_origin": "TOPLEFT"}, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 598.448, "r_x1": 480.592, "r_y1": 598.448, "r_x2": 480.592, "r_y2": 587.159, "r_x3": 151.518, "r_y3": 587.159, "coord_origin": "TOPLEFT"}, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 609.407, "r_x1": 364.179, "r_y1": 609.407, "r_x2": 364.179, "r_y2": 598.1179999999999, "r_x3": 151.518, "r_y3": 598.1179999999999, "coord_origin": "TOPLEFT"}, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition in the wild using transformer and identity matrix-based augmentation. In: Porwal, U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545561. Springer International Publishing, Cham (2022)"}, {"label": "list_item", "id": 6, "page_no": 11, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 139.371, "t": 609.881, "r": 480.587, "b": 632.129, "coord_origin": "TOPLEFT"}, "confidence": 0.9617196321487427, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 621.17, "r_x1": 146.537, "r_y1": 621.17, "r_x2": 146.537, "r_y2": 609.881, "r_x3": 139.371, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 621.17, "r_x1": 168.412, "r_y1": 621.17, "r_x2": 168.412, "r_y2": 609.881, "r_x3": 151.522, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Chi,", "orig": "Chi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.68, "r_y0": 621.17, "r_x1": 183.428, "r_y1": 621.17, "r_x2": 183.428, "r_y2": 609.881, "r_x3": 172.68, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Z.,", "orig": "Z.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.696, "r_y0": 621.17, "r_x1": 480.587, "r_y1": 621.17, "r_x2": 480.587, "r_y2": 609.881, "r_x3": 187.696, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 632.129, "r_x1": 400.225, "r_y1": 632.129, "r_x2": 400.225, "r_y2": 620.84, "r_x3": 151.518, "r_y3": 620.84, "coord_origin": "TOPLEFT"}, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table structure recognition. arXiv preprint arXiv:1908.04729 (2019)"}, {"label": "list_item", "id": 3, "page_no": 11, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 139.371, "t": 632.6030000000001, "r": 480.588, "b": 665.809, "coord_origin": "TOPLEFT"}, "confidence": 0.9754673838615417, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 643.892, "r_x1": 146.537, "r_y1": 643.892, "r_x2": 146.537, "r_y2": 632.6030000000001, "r_x3": 139.371, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 643.892, "r_x1": 191.523, "r_y1": 643.892, "r_x2": 191.523, "r_y2": 632.6030000000001, "r_x3": 151.522, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Deng, Y.,", "orig": "Deng, Y.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.087, "r_y0": 643.892, "r_x1": 240.312, "r_y1": 643.892, "r_x2": 240.312, "r_y2": 632.6030000000001, "r_x3": 196.087, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Rosenberg,", "orig": "Rosenberg,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.876, "r_y0": 643.892, "r_x1": 257.031, "r_y1": 643.892, "r_x2": 257.031, "r_y2": 632.6030000000001, "r_x3": 244.876, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "D.,", "orig": "D.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.586, "r_y0": 643.892, "r_x1": 351.96, "r_y1": 643.892, "r_x2": 351.96, "r_y2": 632.6030000000001, "r_x3": 261.586, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Mann, G.: Challenges", "orig": "Mann, G.: Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.524, "r_y0": 643.892, "r_x1": 364.201, "r_y1": 643.892, "r_x2": 364.201, "r_y2": 632.6030000000001, "r_x3": 356.524, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 368.756, "r_y0": 643.892, "r_x1": 411.757, "r_y1": 643.892, "r_x2": 411.757, "r_y2": 632.6030000000001, "r_x3": 368.756, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "end-to-end", "orig": "end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.321, "r_y0": 643.892, "r_x1": 441.425, "r_y1": 643.892, "r_x2": 441.425, "r_y2": 632.6030000000001, "r_x3": 416.321, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "neural", "orig": "neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.989, "r_y0": 643.892, "r_x1": 480.588, "r_y1": 643.892, "r_x2": 480.588, "r_y2": 632.6030000000001, "r_x3": 445.989, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "scientific", "orig": "scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 654.851, "r_x1": 171.483, "r_y1": 654.851, "r_x2": 171.483, "r_y2": 643.562, "r_x3": 151.518, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.509, "r_y0": 654.851, "r_x1": 222.623, "r_y1": 654.851, "r_x2": 222.623, "r_y2": 643.562, "r_x3": 175.509, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.649, "r_y0": 654.851, "r_x1": 237.652, "r_y1": 654.851, "r_x2": 237.652, "r_y2": 643.562, "r_x3": 226.649, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "In:", "orig": "In:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.678, "r_y0": 654.851, "r_x1": 480.588, "r_y1": 654.851, "r_x2": 480.588, "r_y2": 643.562, "r_x3": 241.678, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 665.809, "r_x1": 350.111, "r_y1": 665.809, "r_x2": 350.111, "r_y2": 654.52, "r_x3": 151.518, "r_y3": 654.52, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific table recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 894-901. IEEE (2019)"}], "body": [{"label": "section_header", "id": 8, "page_no": 11, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 134.765, "t": 117.54899999999998, "r": 219.255, "b": 128.11699999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.915635347366333, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.11699999999996, "r_x1": 141.489, "r_y1": 128.11699999999996, "r_x2": 141.489, "r_y2": 117.54899999999998, "r_x3": 134.765, "r_y3": 117.54899999999998, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.938, "r_y0": 128.11699999999996, "r_x1": 219.255, "r_y1": 128.11699999999996, "r_x2": 219.255, "r_y2": 117.54899999999998, "r_x3": 154.938, "r_y3": 117.54899999999998, "coord_origin": "TOPLEFT"}, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6 Conclusion"}, {"label": "text", "id": 2, "page_no": 11, "cluster": {"id": 2, "label": "text", "bbox": {"l": 134.765, "t": 146.86400000000003, "r": 480.596, "b": 203.48199999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9806171655654907, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 155.66099999999994, "r_x1": 480.595, "r_y1": 155.66099999999994, "r_x2": 480.595, "r_y2": 146.86400000000003, "r_x3": 134.765, "r_y3": 146.86400000000003, "coord_origin": "TOPLEFT"}, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 167.61599999999999, "r_x1": 152.499, "r_y1": 167.61599999999999, "r_x2": 152.499, "r_y2": 158.81899999999996, "r_x3": 134.765, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "ture", "orig": "ture", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.963, "r_y0": 167.61599999999999, "r_x1": 205.131, "r_y1": 167.61599999999999, "r_x2": 205.131, "r_y2": 158.81899999999996, "r_x3": 156.963, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "recognition", "orig": "recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.594, "r_y0": 167.61599999999999, "r_x1": 480.595, "r_y1": 167.61599999999999, "r_x2": 480.595, "r_y2": 158.81899999999996, "r_x3": 209.594, "r_y3": 158.81899999999996, "coord_origin": "TOPLEFT"}, "text": "with Im2Seq models is ill-suited and has serious limitations.", "orig": "with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 179.57100000000003, "r_x1": 480.59, "r_y1": 179.57100000000003, "r_x2": 480.59, "r_y2": 170.774, "r_x3": 134.765, "r_y3": 170.774, "coord_origin": "TOPLEFT"}, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 191.52700000000004, "r_x1": 480.596, "r_y1": 191.52700000000004, "r_x2": 480.596, "r_y2": 182.73000000000002, "r_x3": 134.765, "r_y3": 182.73000000000002, "coord_origin": "TOPLEFT"}, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 203.48199999999997, "r_x1": 239.539, "r_y1": 203.48199999999997, "r_x2": 239.539, "r_y2": 194.68499999999995, "r_x3": 134.765, "r_y3": 194.68499999999995, "coord_origin": "TOPLEFT"}, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We demonstrated that representing tables in HTML for the task of table structure recognition with Im2Seq models is ill-suited and has serious limitations. Furthermore, we presented in this paper an Optimized Table Structure Language (OTSL) which, when compared to commonly used general purpose languages, has several key benefits."}, {"label": "text", "id": 0, "page_no": 11, "cluster": {"id": 0, "label": "text", "bbox": {"l": 134.765, "t": 207.44399999999996, "r": 480.595, "b": 323.837, "coord_origin": "TOPLEFT"}, "confidence": 0.9873476028442383, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 216.24099999999999, "r_x1": 480.593, "r_y1": 216.24099999999999, "r_x2": 480.593, "r_y2": 207.44399999999996, "r_x3": 149.709, "r_y3": 207.44399999999996, "coord_origin": "TOPLEFT"}, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 228.19600000000003, "r_x1": 480.594, "r_y1": 228.19600000000003, "r_x2": 480.594, "r_y2": 219.399, "r_x3": 134.765, "r_y3": 219.399, "coord_origin": "TOPLEFT"}, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 240.15099999999995, "r_x1": 480.591, "r_y1": 240.15099999999995, "r_x2": 480.591, "r_y2": 231.35400000000004, "r_x3": 134.765, "r_y3": 231.35400000000004, "coord_origin": "TOPLEFT"}, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 252.106, "r_x1": 230.936, "r_y1": 252.106, "r_x2": 230.936, "r_y2": 243.30899999999997, "r_x3": 134.765, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "OTSL representation.", "orig": "OTSL representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.838, "r_y0": 252.106, "r_x1": 281.762, "r_y1": 252.106, "r_x2": 281.762, "r_y2": 243.30899999999997, "r_x3": 235.838, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "Additional", "orig": "Additional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.664, "r_y0": 252.106, "r_x1": 340.395, "r_y1": 252.106, "r_x2": 340.395, "r_y2": 243.30899999999997, "r_x3": 286.664, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "performance", "orig": "performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.287, "r_y0": 252.106, "r_x1": 378.82, "r_y1": 252.106, "r_x2": 378.82, "r_y2": 243.30899999999997, "r_x3": 345.287, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "benefits", "orig": "benefits", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.721, "r_y0": 252.106, "r_x1": 456.32, "r_y1": 252.106, "r_x2": 456.32, "r_y2": 243.30899999999997, "r_x3": 383.721, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "can be obtained", "orig": "can be obtained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 461.221, "r_y0": 252.106, "r_x1": 480.588, "r_y1": 252.106, "r_x2": 480.588, "r_y2": 243.30899999999997, "r_x3": 461.221, "r_y3": 243.30899999999997, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 264.062, "r_x1": 480.595, "r_y1": 264.062, "r_x2": 480.595, "r_y2": 255.265, "r_x3": 134.765, "r_y3": 255.265, "coord_origin": "TOPLEFT"}, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 276.01700000000005, "r_x1": 480.588, "r_y1": 276.01700000000005, "r_x2": 480.588, "r_y2": 267.22, "r_x3": 134.765, "r_y3": 267.22, "coord_origin": "TOPLEFT"}, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 287.972, "r_x1": 480.593, "r_y1": 287.972, "r_x2": 480.593, "r_y2": 279.17499999999995, "r_x3": 134.765, "r_y3": 279.17499999999995, "coord_origin": "TOPLEFT"}, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 299.927, "r_x1": 480.589, "r_y1": 299.927, "r_x2": 480.589, "r_y2": 291.13, "r_x3": 134.765, "r_y3": 291.13, "coord_origin": "TOPLEFT"}, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 311.882, "r_x1": 480.594, "r_y1": 311.882, "r_x2": 480.594, "r_y2": 303.085, "r_x3": 134.765, "r_y3": 303.085, "coord_origin": "TOPLEFT"}, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 323.837, "r_x1": 240.923, "r_y1": 323.837, "r_x2": 240.923, "r_y2": 315.04, "r_x3": 134.765, "r_y3": 315.04, "coord_origin": "TOPLEFT"}, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "First and foremost, given the same network configuration, inference time for a table-structure prediction is about 2 times faster compared to the conventional HTML approach. This is primarily owed to the shorter sequence length of the OTSL representation. Additional performance benefits can be obtained with HPO (hyper parameter optimization). As we demonstrate in our experiments, models trained on OTSL can be significantly smaller, e.g. by reducing the number of encoder and decoder layers, while preserving comparatively good prediction quality. This can further improve inference performance, yielding 5-6 times faster inference speed in OTSL with prediction quality comparable to models trained on HTML (see Table 1)."}, {"label": "text", "id": 1, "page_no": 11, "cluster": {"id": 1, "label": "text", "bbox": {"l": 134.765, "t": 327.799, "r": 480.595, "b": 468.103, "coord_origin": "TOPLEFT"}, "confidence": 0.9868747591972351, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.709, "r_y0": 336.596, "r_x1": 480.59, "r_y1": 336.596, "r_x2": 480.59, "r_y2": 327.799, "r_x3": 149.709, "r_y3": 327.799, "coord_origin": "TOPLEFT"}, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 348.552, "r_x1": 480.595, "r_y1": 348.552, "r_x2": 480.595, "r_y2": 339.755, "r_x3": 134.765, "r_y3": 339.755, "coord_origin": "TOPLEFT"}, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 360.507, "r_x1": 480.587, "r_y1": 360.507, "r_x2": 480.587, "r_y2": 351.71, "r_x3": 134.765, "r_y3": 351.71, "coord_origin": "TOPLEFT"}, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 372.462, "r_x1": 480.595, "r_y1": 372.462, "r_x2": 480.595, "r_y2": 363.665, "r_x3": 134.765, "r_y3": 363.665, "coord_origin": "TOPLEFT"}, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 384.417, "r_x1": 480.59, "r_y1": 384.417, "r_x2": 480.59, "r_y2": 375.62, "r_x3": 134.765, "r_y3": 375.62, "coord_origin": "TOPLEFT"}, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 396.372, "r_x1": 480.587, "r_y1": 396.372, "r_x2": 480.587, "r_y2": 387.575, "r_x3": 134.765, "r_y3": 387.575, "coord_origin": "TOPLEFT"}, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 408.328, "r_x1": 480.586, "r_y1": 408.328, "r_x2": 480.586, "r_y2": 399.531, "r_x3": 134.765, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 420.283, "r_x1": 480.587, "r_y1": 420.283, "r_x2": 480.587, "r_y2": 411.486, "r_x3": 134.765, "r_y3": 411.486, "coord_origin": "TOPLEFT"}, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 432.238, "r_x1": 480.595, "r_y1": 432.238, "r_x2": 480.595, "r_y2": 423.441, "r_x3": 134.765, "r_y3": 423.441, "coord_origin": "TOPLEFT"}, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 444.193, "r_x1": 480.588, "r_y1": 444.193, "r_x2": 480.588, "r_y2": 435.396, "r_x3": 134.765, "r_y3": 435.396, "coord_origin": "TOPLEFT"}, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 456.148, "r_x1": 480.59, "r_y1": 456.148, "r_x2": 480.59, "r_y2": 447.351, "r_x3": 134.765, "r_y3": 447.351, "coord_origin": "TOPLEFT"}, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 468.103, "r_x1": 366.777, "r_y1": 468.103, "r_x2": 366.777, "r_y2": 459.306, "r_x3": 134.765, "r_y3": 459.306, "coord_origin": "TOPLEFT"}, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vocabulary size. This allows autoregressive models to perform better in the TED metric, but especially with regards to prediction accuracy of the table-cell bounding boxes (see Table 2). As shown in Figure 5, we observe that the OTSL drastically reduces the drift for table cell bounding boxes at high row count and in sparse tables. This leads to more accurate predictions and a significant reduction in post-processing complexity, which is an undesired necessity in HTML-based Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few, simple and always backwards looking. Each new token can be validated only by analyzing the sequence of previous tokens, without requiring the entire sequence to detect mistakes. This in return allows to perform structural error detection and correction on-the-fly during sequence generation."}, {"label": "section_header", "id": 7, "page_no": 11, "cluster": {"id": 7, "label": "section_header", "bbox": {"l": 134.765, "t": 493.821, "r": 197.686, "b": 504.389, "coord_origin": "TOPLEFT"}, "confidence": 0.9403266310691833, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 504.389, "r_x1": 197.686, "r_y1": 504.389, "r_x2": 197.686, "r_y2": 493.821, "r_x3": 134.765, "r_y3": 493.821, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "References"}, {"label": "list_item", "id": 5, "page_no": 11, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 139.371, "t": 520.602, "r": 480.592, "b": 563.8720000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9698606729507446, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 531.8910000000001, "r_x1": 146.537, "r_y1": 531.8910000000001, "r_x2": 146.537, "r_y2": 520.602, "r_x3": 139.371, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 531.8910000000001, "r_x1": 189.958, "r_y1": 531.8910000000001, "r_x2": 189.958, "r_y2": 520.602, "r_x3": 151.522, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Auer, C.,", "orig": "Auer, C.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.342, "r_y0": 531.8910000000001, "r_x1": 216.222, "r_y1": 531.8910000000001, "r_x2": 216.222, "r_y2": 520.602, "r_x3": 194.342, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Dolfi,", "orig": "Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.607, "r_y0": 531.8910000000001, "r_x1": 277.21, "r_y1": 531.8910000000001, "r_x2": 277.21, "r_y2": 520.602, "r_x3": 220.607, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "M., Carvalho,", "orig": "M., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.594, "r_y0": 531.8910000000001, "r_x1": 293.621, "r_y1": 531.8910000000001, "r_x2": 293.621, "r_y2": 520.602, "r_x3": 281.594, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "A.,", "orig": "A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.996, "r_y0": 531.8910000000001, "r_x1": 379.518, "r_y1": 531.8910000000001, "r_x2": 379.518, "r_y2": 520.602, "r_x3": 297.996, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Ramis, C.B., Staar,", "orig": "Ramis, C.B., Staar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.894, "r_y0": 531.8910000000001, "r_x1": 413.839, "r_y1": 531.8910000000001, "r_x2": 413.839, "r_y2": 520.602, "r_x3": 383.894, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "P.W.J.:", "orig": "P.W.J.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.214, "r_y0": 531.8910000000001, "r_x1": 459.065, "r_y1": 531.8910000000001, "r_x2": 459.065, "r_y2": 520.602, "r_x3": 418.214, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "Delivering", "orig": "Delivering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.441, "r_y0": 531.8910000000001, "r_x1": 480.592, "r_y1": 531.8910000000001, "r_x2": 480.592, "r_y2": 520.602, "r_x3": 463.441, "r_y3": 520.602, "coord_origin": "TOPLEFT"}, "text": "doc-", "orig": "doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 542.85, "r_x1": 235.799, "r_y1": 542.85, "r_x2": 235.799, "r_y2": 531.5609999999999, "r_x3": 151.518, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "ument conversion as", "orig": "ument conversion as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.246, "r_y0": 542.85, "r_x1": 270.806, "r_y1": 542.85, "r_x2": 270.806, "r_y2": 531.5609999999999, "r_x3": 240.246, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "a cloud", "orig": "a cloud", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.262, "r_y0": 542.85, "r_x1": 302.214, "r_y1": 542.85, "r_x2": 302.214, "r_y2": 531.5609999999999, "r_x3": 275.262, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "service", "orig": "service", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.661, "r_y0": 542.85, "r_x1": 346.433, "r_y1": 542.85, "r_x2": 346.433, "r_y2": 531.5609999999999, "r_x3": 306.661, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "with high", "orig": "with high", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.889, "r_y0": 542.85, "r_x1": 480.587, "r_y1": 542.85, "r_x2": 480.587, "r_y2": 531.5609999999999, "r_x3": 350.889, "r_y3": 531.5609999999999, "coord_origin": "TOPLEFT"}, "text": "throughput and responsiveness.", "orig": "throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 553.809, "r_x1": 176.341, "r_y1": 553.809, "r_x2": 176.341, "r_y2": 542.52, "r_x3": 151.518, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.464, "r_y0": 552.6610000000001, "r_x1": 250.68, "r_y1": 552.6610000000001, "r_x2": 250.68, "r_y2": 544.735, "r_x3": 179.464, "r_y3": 544.735, "coord_origin": "TOPLEFT"}, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.804, "r_y0": 553.809, "r_x1": 281.957, "r_y1": 553.809, "r_x2": 281.957, "r_y2": 542.52, "r_x3": 253.804, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.078, "r_y0": 552.913, "r_x1": 478.034, "r_y1": 552.913, "r_x2": 478.034, "r_y2": 545.444, "r_x3": 285.078, "r_y3": 545.444, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.032, "r_y0": 553.809, "r_x1": 480.591, "r_y1": 553.809, "r_x2": 480.591, "r_y2": 542.52, "r_x3": 478.032, "r_y3": 542.52, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 563.8720000000001, "r_x1": 344.474, "r_y1": 563.8720000000001, "r_x2": 344.474, "r_y2": 556.403, "r_x3": 151.518, "r_y3": 556.403, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering document conversion as a cloud service with high throughput and responsiveness. CoRR abs/2206.00785 (2022). https://doi.org/10.48550/arXiv.2206.00785 , https://doi.org/10.48550/arXiv.2206.00785"}, {"label": "list_item", "id": 4, "page_no": 11, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 139.371, "t": 565.241, "r": 480.592, "b": 609.407, "coord_origin": "TOPLEFT"}, "confidence": 0.9730570316314697, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 576.53, "r_x1": 146.537, "r_y1": 576.53, "r_x2": 146.537, "r_y2": 565.241, "r_x3": 139.371, "r_y3": 565.241, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 576.53, "r_x1": 480.586, "r_y1": 576.53, "r_x2": 480.586, "r_y2": 565.241, "r_x3": 151.522, "r_y3": 565.241, "coord_origin": "TOPLEFT"}, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 587.489, "r_x1": 480.59, "r_y1": 587.489, "r_x2": 480.59, "r_y2": 576.2, "r_x3": 151.518, "r_y3": 576.2, "coord_origin": "TOPLEFT"}, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 598.448, "r_x1": 480.592, "r_y1": 598.448, "r_x2": 480.592, "r_y2": 587.159, "r_x3": 151.518, "r_y3": 587.159, "coord_origin": "TOPLEFT"}, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 609.407, "r_x1": 364.179, "r_y1": 609.407, "r_x2": 364.179, "r_y2": 598.1179999999999, "r_x3": 151.518, "r_y3": 598.1179999999999, "coord_origin": "TOPLEFT"}, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition in the wild using transformer and identity matrix-based augmentation. In: Porwal, U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545561. Springer International Publishing, Cham (2022)"}, {"label": "list_item", "id": 6, "page_no": 11, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 139.371, "t": 609.881, "r": 480.587, "b": 632.129, "coord_origin": "TOPLEFT"}, "confidence": 0.9617196321487427, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 621.17, "r_x1": 146.537, "r_y1": 621.17, "r_x2": 146.537, "r_y2": 609.881, "r_x3": 139.371, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 621.17, "r_x1": 168.412, "r_y1": 621.17, "r_x2": 168.412, "r_y2": 609.881, "r_x3": 151.522, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Chi,", "orig": "Chi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.68, "r_y0": 621.17, "r_x1": 183.428, "r_y1": 621.17, "r_x2": 183.428, "r_y2": 609.881, "r_x3": 172.68, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Z.,", "orig": "Z.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.696, "r_y0": 621.17, "r_x1": 480.587, "r_y1": 621.17, "r_x2": 480.587, "r_y2": 609.881, "r_x3": 187.696, "r_y3": 609.881, "coord_origin": "TOPLEFT"}, "text": "Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 632.129, "r_x1": 400.225, "r_y1": 632.129, "r_x2": 400.225, "r_y2": 620.84, "r_x3": 151.518, "r_y3": 620.84, "coord_origin": "TOPLEFT"}, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table structure recognition. arXiv preprint arXiv:1908.04729 (2019)"}, {"label": "list_item", "id": 3, "page_no": 11, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 139.371, "t": 632.6030000000001, "r": 480.588, "b": 665.809, "coord_origin": "TOPLEFT"}, "confidence": 0.9754673838615417, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 643.892, "r_x1": 146.537, "r_y1": 643.892, "r_x2": 146.537, "r_y2": 632.6030000000001, "r_x3": 139.371, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 643.892, "r_x1": 191.523, "r_y1": 643.892, "r_x2": 191.523, "r_y2": 632.6030000000001, "r_x3": 151.522, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Deng, Y.,", "orig": "Deng, Y.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.087, "r_y0": 643.892, "r_x1": 240.312, "r_y1": 643.892, "r_x2": 240.312, "r_y2": 632.6030000000001, "r_x3": 196.087, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Rosenberg,", "orig": "Rosenberg,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.876, "r_y0": 643.892, "r_x1": 257.031, "r_y1": 643.892, "r_x2": 257.031, "r_y2": 632.6030000000001, "r_x3": 244.876, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "D.,", "orig": "D.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.586, "r_y0": 643.892, "r_x1": 351.96, "r_y1": 643.892, "r_x2": 351.96, "r_y2": 632.6030000000001, "r_x3": 261.586, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "Mann, G.: Challenges", "orig": "Mann, G.: Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.524, "r_y0": 643.892, "r_x1": 364.201, "r_y1": 643.892, "r_x2": 364.201, "r_y2": 632.6030000000001, "r_x3": 356.524, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 368.756, "r_y0": 643.892, "r_x1": 411.757, "r_y1": 643.892, "r_x2": 411.757, "r_y2": 632.6030000000001, "r_x3": 368.756, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "end-to-end", "orig": "end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.321, "r_y0": 643.892, "r_x1": 441.425, "r_y1": 643.892, "r_x2": 441.425, "r_y2": 632.6030000000001, "r_x3": 416.321, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "neural", "orig": "neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.989, "r_y0": 643.892, "r_x1": 480.588, "r_y1": 643.892, "r_x2": 480.588, "r_y2": 632.6030000000001, "r_x3": 445.989, "r_y3": 632.6030000000001, "coord_origin": "TOPLEFT"}, "text": "scientific", "orig": "scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 654.851, "r_x1": 171.483, "r_y1": 654.851, "r_x2": 171.483, "r_y2": 643.562, "r_x3": 151.518, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.509, "r_y0": 654.851, "r_x1": 222.623, "r_y1": 654.851, "r_x2": 222.623, "r_y2": 643.562, "r_x3": 175.509, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.649, "r_y0": 654.851, "r_x1": 237.652, "r_y1": 654.851, "r_x2": 237.652, "r_y2": 643.562, "r_x3": 226.649, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "In:", "orig": "In:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.678, "r_y0": 654.851, "r_x1": 480.588, "r_y1": 654.851, "r_x2": 480.588, "r_y2": 643.562, "r_x3": 241.678, "r_y3": 643.562, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 665.809, "r_x1": 350.111, "r_y1": 665.809, "r_x2": 350.111, "r_y2": 654.52, "r_x3": 151.518, "r_y3": 654.52, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific table recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 894-901. IEEE (2019)"}], "headers": [{"label": "page_header", "id": 10, "page_no": 11, "cluster": {"id": 10, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 143.979, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8610832691192627, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "12"}, {"label": "page_header", "id": 9, "page_no": 11, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 167.821, "t": 91.49300000000005, "r": 231.72, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8927664756774902, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}]}}, {"page_no": 12, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.376, "r_y0": 102.78200000000004, "r_x1": 480.59, "r_y1": 102.78200000000004, "r_x2": 480.59, "r_y2": 91.49300000000005, "r_x3": 471.376, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 128.68499999999995, "r_x1": 146.537, "r_y1": 128.68499999999995, "r_x2": 146.537, "r_y2": 117.39599999999996, "r_x3": 139.371, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 128.68499999999995, "r_x1": 480.588, "r_y1": 128.68499999999995, "r_x2": 480.588, "r_y2": 117.39599999999996, "r_x3": 151.522, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 139.644, "r_x1": 480.595, "r_y1": 139.644, "r_x2": 480.595, "r_y2": 128.35500000000002, "r_x3": 151.518, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 150.60299999999995, "r_x1": 304.044, "r_y1": 150.60299999999995, "r_x2": 304.044, "r_y2": 139.31399999999996, "r_x3": 151.518, "r_y3": 139.31399999999996, "coord_origin": "TOPLEFT"}, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 161.57299999999998, "r_x1": 146.537, "r_y1": 161.57299999999998, "r_x2": 146.537, "r_y2": 150.284, "r_x3": 139.371, "r_y3": 150.284, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 161.57299999999998, "r_x1": 480.59, "r_y1": 161.57299999999998, "r_x2": 480.59, "r_y2": 150.284, "r_x3": 151.522, "r_y3": 150.284, "coord_origin": "TOPLEFT"}, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 172.53200000000004, "r_x1": 480.59, "r_y1": 172.53200000000004, "r_x2": 480.59, "r_y2": 161.24300000000005, "r_x3": 151.518, "r_y3": 161.24300000000005, "coord_origin": "TOPLEFT"}, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 183.49099999999999, "r_x1": 480.593, "r_y1": 183.49099999999999, "r_x2": 480.593, "r_y2": 172.202, "r_x3": 151.518, "r_y3": 172.202, "coord_origin": "TOPLEFT"}, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 194.45000000000005, "r_x1": 226.374, "r_y1": 194.45000000000005, "r_x2": 226.374, "r_y2": 183.16099999999994, "r_x3": 151.518, "r_y3": 183.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 205.41999999999996, "r_x1": 146.537, "r_y1": 205.41999999999996, "r_x2": 146.537, "r_y2": 194.13099999999997, "r_x3": 139.371, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 205.41999999999996, "r_x1": 162.398, "r_y1": 205.41999999999996, "r_x2": 162.398, "r_y2": 194.13099999999997, "r_x3": 151.522, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "Li,", "orig": "Li,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.298, "r_y0": 205.41999999999996, "r_x1": 480.59, "r_y1": 205.41999999999996, "r_x2": 480.59, "r_y2": 194.13099999999997, "r_x3": 166.298, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 216.37900000000002, "r_x1": 352.017, "r_y1": 216.37900000000002, "r_x2": 352.017, "r_y2": 205.09000000000003, "r_x3": 151.518, "r_y3": 205.09000000000003, "coord_origin": "TOPLEFT"}, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 227.35000000000002, "r_x1": 146.537, "r_y1": 227.35000000000002, "r_x2": 146.537, "r_y2": 216.06100000000004, "r_x3": 139.371, "r_y3": 216.06100000000004, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 227.35000000000002, "r_x1": 480.587, "r_y1": 227.35000000000002, "r_x2": 480.587, "r_y2": 216.06100000000004, "r_x3": 151.522, "r_y3": 216.06100000000004, "coord_origin": "TOPLEFT"}, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 238.30899999999997, "r_x1": 189.414, "r_y1": 238.30899999999997, "r_x2": 189.414, "r_y2": 227.01999999999998, "r_x3": 151.518, "r_y3": 227.01999999999998, "coord_origin": "TOPLEFT"}, "text": "A., Dolfi,", "orig": "A., Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.414, "r_y0": 238.30899999999997, "r_x1": 480.59, "r_y1": 238.30899999999997, "r_x2": 480.59, "r_y2": 227.01999999999998, "r_x3": 193.414, "r_y3": 227.01999999999998, "coord_origin": "TOPLEFT"}, "text": "M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 249.26800000000003, "r_x1": 480.595, "r_y1": 249.26800000000003, "r_x2": 480.595, "r_y2": 237.97900000000004, "r_x3": 151.518, "r_y3": 237.97900000000004, "coord_origin": "TOPLEFT"}, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 260.227, "r_x1": 197.086, "r_y1": 260.227, "r_x2": 197.086, "r_y2": 248.938, "r_x3": 151.518, "r_y3": 248.938, "coord_origin": "TOPLEFT"}, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.4, "r_y0": 259.07899999999995, "r_x1": 210.007, "r_y1": 259.07899999999995, "r_x2": 210.007, "r_y2": 251.15300000000002, "r_x3": 199.4, "r_y3": 251.15300000000002, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.007, "r_y0": 260.227, "r_x1": 332.377, "r_y1": 260.227, "r_x2": 332.377, "r_y2": 248.938, "r_x3": 210.007, "r_y3": 248.938, "coord_origin": "TOPLEFT"}, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.699, "r_y0": 259.331, "r_x1": 480.59, "r_y1": 259.331, "r_x2": 480.59, "r_y2": 251.86199999999997, "r_x3": 334.699, "r_y3": 251.86199999999997, "coord_origin": "TOPLEFT"}, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 270.289, "r_x1": 259.758, "r_y1": 270.289, "r_x2": 259.758, "r_y2": 262.82000000000005, "r_x3": 151.518, "r_y3": 262.82000000000005, "coord_origin": "TOPLEFT"}, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 282.156, "r_x1": 146.537, "r_y1": 282.156, "r_x2": 146.537, "r_y2": 270.86699999999996, "r_x3": 139.371, "r_y3": 270.86699999999996, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 282.156, "r_x1": 480.588, "r_y1": 282.156, "r_x2": 480.588, "r_y2": 270.86699999999996, "r_x3": 151.522, "r_y3": 270.86699999999996, "coord_origin": "TOPLEFT"}, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 293.115, "r_x1": 480.594, "r_y1": 293.115, "r_x2": 480.594, "r_y2": 281.826, "r_x3": 151.518, "r_y3": 281.826, "coord_origin": "TOPLEFT"}, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 304.074, "r_x1": 473.443, "r_y1": 304.074, "r_x2": 473.443, "r_y2": 292.785, "r_x3": 151.518, "r_y3": 292.785, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 315.044, "r_x1": 146.537, "r_y1": 315.044, "r_x2": 146.537, "r_y2": 303.755, "r_x3": 134.764, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 315.044, "r_x1": 195.667, "r_y1": 315.044, "r_x2": 195.667, "r_y2": 303.755, "r_x3": 151.522, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Pfitzmann,", "orig": "Pfitzmann,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.249, "r_y0": 315.044, "r_x1": 211.893, "r_y1": 315.044, "r_x2": 211.893, "r_y2": 303.755, "r_x3": 200.249, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "B.,", "orig": "B.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.484, "r_y0": 315.044, "r_x1": 238.772, "r_y1": 315.044, "r_x2": 238.772, "r_y2": 303.755, "r_x3": 216.484, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Auer,", "orig": "Auer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.362, "r_y0": 315.044, "r_x1": 255.134, "r_y1": 315.044, "r_x2": 255.134, "r_y2": 303.755, "r_x3": 243.362, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "C.,", "orig": "C.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.725, "r_y0": 315.044, "r_x1": 281.605, "r_y1": 315.044, "r_x2": 281.605, "r_y2": 303.755, "r_x3": 259.725, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Dolfi,", "orig": "Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.187, "r_y0": 315.044, "r_x1": 299.748, "r_y1": 315.044, "r_x2": 299.748, "r_y2": 303.755, "r_x3": 286.187, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "M.,", "orig": "M.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.339, "r_y0": 315.044, "r_x1": 333.893, "r_y1": 315.044, "r_x2": 333.893, "r_y2": 303.755, "r_x3": 304.339, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Nassar,", "orig": "Nassar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.483, "r_y0": 315.044, "r_x1": 358.187, "r_y1": 315.044, "r_x2": 358.187, "r_y2": 303.755, "r_x3": 338.483, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "A.S.,", "orig": "A.S.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.778, "r_y0": 315.044, "r_x1": 386.855, "r_y1": 315.044, "r_x2": 386.855, "r_y2": 303.755, "r_x3": 362.778, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Staar,", "orig": "Staar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.437, "r_y0": 315.044, "r_x1": 421.382, "r_y1": 315.044, "r_x2": 421.382, "r_y2": 303.755, "r_x3": 391.437, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "P.W.J.:", "orig": "P.W.J.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.973, "r_y0": 315.044, "r_x1": 469.09, "r_y1": 315.044, "r_x2": 469.09, "r_y2": 303.755, "r_x3": 425.973, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Doclaynet:", "orig": "Doclaynet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.68, "r_y0": 315.044, "r_x1": 480.589, "r_y1": 315.044, "r_x2": 480.589, "r_y2": 303.755, "r_x3": 473.68, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 326.003, "r_x1": 480.59, "r_y1": 326.003, "r_x2": 480.59, "r_y2": 314.714, "r_x3": 151.518, "r_y3": 314.714, "coord_origin": "TOPLEFT"}, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 336.962, "r_x1": 480.591, "r_y1": 336.962, "r_x2": 480.591, "r_y2": 325.673, "r_x3": 151.518, "r_y3": 325.673, "coord_origin": "TOPLEFT"}, "text": "Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 347.921, "r_x1": 480.591, "r_y1": 347.921, "r_x2": 480.591, "r_y2": 336.632, "r_x3": 151.518, "r_y3": 336.632, "coord_origin": "TOPLEFT"}, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 358.88, "r_x1": 251.141, "r_y1": 358.88, "r_x2": 251.141, "r_y2": 347.591, "r_x3": 151.518, "r_y3": 347.591, "coord_origin": "TOPLEFT"}, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.99, "r_y0": 357.984, "r_x1": 437.533, "r_y1": 357.984, "r_x2": 437.533, "r_y2": 350.515, "r_x3": 253.99, "r_y3": 350.515, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.532, "r_y0": 358.88, "r_x1": 440.091, "r_y1": 358.88, "r_x2": 440.091, "r_y2": 347.591, "r_x3": 437.532, "r_y3": 347.591, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.942, "r_y0": 357.984, "r_x1": 480.594, "r_y1": 357.984, "r_x2": 480.594, "r_y2": 350.515, "r_x3": 442.942, "r_y3": 350.515, "coord_origin": "TOPLEFT"}, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 368.943, "r_x1": 297.409, "r_y1": 368.943, "r_x2": 297.409, "r_y2": 361.474, "r_x3": 151.518, "r_y3": 361.474, "coord_origin": "TOPLEFT"}, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 380.809, "r_x1": 146.537, "r_y1": 380.809, "r_x2": 146.537, "r_y2": 369.52, "r_x3": 134.764, "r_y3": 369.52, "coord_origin": "TOPLEFT"}, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 380.809, "r_x1": 480.589, "r_y1": 380.809, "r_x2": 480.589, "r_y2": 369.52, "r_x3": 151.522, "r_y3": 369.52, "coord_origin": "TOPLEFT"}, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 391.768, "r_x1": 480.593, "r_y1": 391.768, "r_x2": 480.593, "r_y2": 380.479, "r_x3": 151.518, "r_y3": 380.479, "coord_origin": "TOPLEFT"}, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 402.727, "r_x1": 480.593, "r_y1": 402.727, "r_x2": 480.593, "r_y2": 391.438, "r_x3": 151.518, "r_y3": 391.438, "coord_origin": "TOPLEFT"}, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 413.686, "r_x1": 373.827, "r_y1": 413.686, "r_x2": 373.827, "r_y2": 402.397, "r_x3": 151.518, "r_y3": 402.397, "coord_origin": "TOPLEFT"}, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 424.656, "r_x1": 146.537, "r_y1": 424.656, "r_x2": 146.537, "r_y2": 413.367, "r_x3": 134.764, "r_y3": 413.367, "coord_origin": "TOPLEFT"}, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 424.656, "r_x1": 480.587, "r_y1": 424.656, "r_x2": 480.587, "r_y2": 413.367, "r_x3": 151.522, "r_y3": 413.367, "coord_origin": "TOPLEFT"}, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 435.615, "r_x1": 480.595, "r_y1": 435.615, "r_x2": 480.595, "r_y2": 424.326, "r_x3": 151.518, "r_y3": 424.326, "coord_origin": "TOPLEFT"}, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 446.574, "r_x1": 480.588, "r_y1": 446.574, "r_x2": 480.588, "r_y2": 435.285, "r_x3": 151.518, "r_y3": 435.285, "coord_origin": "TOPLEFT"}, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 457.533, "r_x1": 292.915, "r_y1": 457.533, "r_x2": 292.915, "r_y2": 446.244, "r_x3": 151.518, "r_y3": 446.244, "coord_origin": "TOPLEFT"}, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 468.503, "r_x1": 146.537, "r_y1": 468.503, "r_x2": 146.537, "r_y2": 457.214, "r_x3": 134.764, "r_y3": 457.214, "coord_origin": "TOPLEFT"}, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 468.503, "r_x1": 480.59, "r_y1": 468.503, "r_x2": 480.59, "r_y2": 457.214, "r_x3": 151.522, "r_y3": 457.214, "coord_origin": "TOPLEFT"}, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 479.462, "r_x1": 480.591, "r_y1": 479.462, "r_x2": 480.591, "r_y2": 468.173, "r_x3": 151.518, "r_y3": 468.173, "coord_origin": "TOPLEFT"}, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 490.421, "r_x1": 439.06, "r_y1": 490.421, "r_x2": 439.06, "r_y2": 479.132, "r_x3": 151.518, "r_y3": 479.132, "coord_origin": "TOPLEFT"}, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.942, "r_y0": 489.525, "r_x1": 480.594, "r_y1": 489.525, "r_x2": 480.594, "r_y2": 482.056, "r_x3": 442.942, "r_y3": 482.056, "coord_origin": "TOPLEFT"}, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 500.484, "r_x1": 302.116, "r_y1": 500.484, "r_x2": 302.116, "r_y2": 493.015, "r_x3": 151.518, "r_y3": 493.015, "coord_origin": "TOPLEFT"}, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 512.35, "r_x1": 146.537, "r_y1": 512.35, "r_x2": 146.537, "r_y2": 501.061, "r_x3": 134.764, "r_y3": 501.061, "coord_origin": "TOPLEFT"}, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 512.35, "r_x1": 480.591, "r_y1": 512.35, "r_x2": 480.591, "r_y2": 501.061, "r_x3": 151.522, "r_y3": 501.061, "coord_origin": "TOPLEFT"}, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 523.309, "r_x1": 480.593, "r_y1": 523.309, "r_x2": 480.593, "r_y2": 512.02, "r_x3": 151.518, "r_y3": 512.02, "coord_origin": "TOPLEFT"}, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 534.268, "r_x1": 480.588, "r_y1": 534.268, "r_x2": 480.588, "r_y2": 522.979, "r_x3": 151.518, "r_y3": 522.979, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 545.227, "r_x1": 199.247, "r_y1": 545.227, "r_x2": 199.247, "r_y2": 533.938, "r_x3": 151.518, "r_y3": 533.938, "coord_origin": "TOPLEFT"}, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 556.197, "r_x1": 146.537, "r_y1": 556.197, "r_x2": 146.537, "r_y2": 544.908, "r_x3": 134.764, "r_y3": 544.908, "coord_origin": "TOPLEFT"}, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 556.197, "r_x1": 480.587, "r_y1": 556.197, "r_x2": 480.587, "r_y2": 544.908, "r_x3": 151.522, "r_y3": 544.908, "coord_origin": "TOPLEFT"}, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 567.156, "r_x1": 480.588, "r_y1": 567.156, "r_x2": 480.588, "r_y2": 555.867, "r_x3": 151.518, "r_y3": 555.867, "coord_origin": "TOPLEFT"}, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 578.115, "r_x1": 480.591, "r_y1": 578.115, "r_x2": 480.591, "r_y2": 566.826, "r_x3": 151.518, "r_y3": 566.826, "coord_origin": "TOPLEFT"}, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 589.0740000000001, "r_x1": 480.592, "r_y1": 589.0740000000001, "r_x2": 480.592, "r_y2": 577.785, "r_x3": 151.518, "r_y3": 577.785, "coord_origin": "TOPLEFT"}, "text": "ing. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 600.033, "r_x1": 200.758, "r_y1": 600.033, "r_x2": 200.758, "r_y2": 588.744, "r_x3": 151.518, "r_y3": 588.744, "coord_origin": "TOPLEFT"}, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.916, "r_y0": 599.137, "r_x1": 386.459, "r_y1": 599.137, "r_x2": 386.459, "r_y2": 591.668, "r_x3": 202.916, "r_y3": 591.668, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.458, "r_y0": 600.033, "r_x1": 389.017, "r_y1": 600.033, "r_x2": 389.017, "r_y2": 588.744, "r_x3": 386.458, "r_y3": 588.744, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.173, "r_y0": 599.137, "r_x1": 480.596, "r_y1": 599.137, "r_x2": 480.596, "r_y2": 591.668, "r_x3": 391.173, "r_y3": 591.668, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 610.096, "r_x1": 245.638, "r_y1": 610.096, "r_x2": 245.638, "r_y2": 602.627, "r_x3": 151.518, "r_y3": 602.627, "coord_origin": "TOPLEFT"}, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 621.962, "r_x1": 146.537, "r_y1": 621.962, "r_x2": 146.537, "r_y2": 610.673, "r_x3": 134.764, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 621.962, "r_x1": 194.229, "r_y1": 621.962, "r_x2": 194.229, "r_y2": 610.673, "r_x3": 151.522, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Wang, X.:", "orig": "Wang, X.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.313, "r_y0": 621.962, "r_x1": 230.817, "r_y1": 621.962, "r_x2": 230.817, "r_y2": 610.673, "r_x3": 199.313, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Tabular", "orig": "Tabular", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.91, "r_y0": 621.962, "r_x1": 285.885, "r_y1": 621.962, "r_x2": 285.885, "r_y2": 610.673, "r_x3": 235.91, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Abstraction,", "orig": "Abstraction,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 290.969, "r_y0": 621.962, "r_x1": 323.342, "r_y1": 621.962, "r_x2": 323.342, "r_y2": 610.673, "r_x3": 290.969, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Editing,", "orig": "Editing,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.435, "r_y0": 621.962, "r_x1": 343.278, "r_y1": 621.962, "r_x2": 343.278, "r_y2": 610.673, "r_x3": 328.435, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.371, "r_y0": 621.962, "r_x1": 396.118, "r_y1": 621.962, "r_x2": 396.118, "r_y2": 610.673, "r_x3": 348.371, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Formatting.", "orig": "Formatting.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.21, "r_y0": 621.962, "r_x1": 424.753, "r_y1": 621.962, "r_x2": 424.753, "r_y2": 610.673, "r_x3": 401.21, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Ph.D.", "orig": "Ph.D.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.846, "r_y0": 621.962, "r_x1": 455.031, "r_y1": 621.962, "r_x2": 455.031, "r_y2": 610.673, "r_x3": 429.846, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "thesis,", "orig": "thesis,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.124, "r_y0": 621.962, "r_x1": 480.595, "r_y1": 621.962, "r_x2": 480.595, "r_y2": 610.673, "r_x3": 460.124, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "CAN", "orig": "CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 632.921, "r_x1": 234.43, "r_y1": 632.921, "r_x2": 234.43, "r_y2": 621.6320000000001, "r_x3": 151.518, "r_y3": 621.6320000000001, "coord_origin": "TOPLEFT"}, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 643.891, "r_x1": 146.537, "r_y1": 643.891, "r_x2": 146.537, "r_y2": 632.602, "r_x3": 134.764, "r_y3": 632.602, "coord_origin": "TOPLEFT"}, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 643.891, "r_x1": 480.587, "r_y1": 643.891, "r_x2": 480.587, "r_y2": 632.602, "r_x3": 151.522, "r_y3": 632.602, "coord_origin": "TOPLEFT"}, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 654.85, "r_x1": 480.591, "r_y1": 654.85, "r_x2": 480.591, "r_y2": 643.561, "r_x3": 151.518, "r_y3": 643.561, "coord_origin": "TOPLEFT"}, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 665.809, "r_x1": 299.303, "r_y1": 665.809, "r_x2": 299.303, "r_y2": 654.52, "r_x3": 151.518, "r_y3": 654.52, "coord_origin": "TOPLEFT"}, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 13, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9163166880607605, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "page_header", "bbox": {"l": 471.376, "t": 91.49300000000005, "r": 480.59, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9061064720153809, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.376, "r_y0": 102.78200000000004, "r_x1": 480.59, "r_y1": 102.78200000000004, "r_x2": 480.59, "r_y2": 91.49300000000005, "r_x3": 471.376, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 139.371, "t": 117.39599999999996, "r": 480.595, "b": 150.60299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9677112698554993, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 128.68499999999995, "r_x1": 146.537, "r_y1": 128.68499999999995, "r_x2": 146.537, "r_y2": 117.39599999999996, "r_x3": 139.371, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 128.68499999999995, "r_x1": 480.588, "r_y1": 128.68499999999995, "r_x2": 480.588, "r_y2": 117.39599999999996, "r_x3": 151.522, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 139.644, "r_x1": 480.595, "r_y1": 139.644, "r_x2": 480.595, "r_y2": 128.35500000000002, "r_x3": 151.518, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 150.60299999999995, "r_x1": 304.044, "r_y1": 150.60299999999995, "r_x2": 304.044, "r_y2": 139.31399999999996, "r_x3": 151.518, "r_y3": 139.31399999999996, "coord_origin": "TOPLEFT"}, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "list_item", "bbox": {"l": 139.371, "t": 150.284, "r": 480.593, "b": 194.45000000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.973045289516449, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 161.57299999999998, "r_x1": 146.537, "r_y1": 161.57299999999998, "r_x2": 146.537, "r_y2": 150.284, "r_x3": 139.371, "r_y3": 150.284, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 161.57299999999998, "r_x1": 480.59, "r_y1": 161.57299999999998, "r_x2": 480.59, "r_y2": 150.284, "r_x3": 151.522, "r_y3": 150.284, "coord_origin": "TOPLEFT"}, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 172.53200000000004, "r_x1": 480.59, "r_y1": 172.53200000000004, "r_x2": 480.59, "r_y2": 161.24300000000005, "r_x3": 151.518, "r_y3": 161.24300000000005, "coord_origin": "TOPLEFT"}, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 183.49099999999999, "r_x1": 480.593, "r_y1": 183.49099999999999, "r_x2": 480.593, "r_y2": 172.202, "r_x3": 151.518, "r_y3": 172.202, "coord_origin": "TOPLEFT"}, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 194.45000000000005, "r_x1": 226.374, "r_y1": 194.45000000000005, "r_x2": 226.374, "r_y2": 183.16099999999994, "r_x3": 151.518, "r_y3": 183.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 139.371, "t": 194.13099999999997, "r": 480.59, "b": 216.37900000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9582491517066956, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 205.41999999999996, "r_x1": 146.537, "r_y1": 205.41999999999996, "r_x2": 146.537, "r_y2": 194.13099999999997, "r_x3": 139.371, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 205.41999999999996, "r_x1": 162.398, "r_y1": 205.41999999999996, "r_x2": 162.398, "r_y2": 194.13099999999997, "r_x3": 151.522, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "Li,", "orig": "Li,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.298, "r_y0": 205.41999999999996, "r_x1": 480.59, "r_y1": 205.41999999999996, "r_x2": 480.59, "r_y2": 194.13099999999997, "r_x3": 166.298, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 216.37900000000002, "r_x1": 352.017, "r_y1": 216.37900000000002, "r_x2": 352.017, "r_y2": 205.09000000000003, "r_x3": 151.518, "r_y3": 205.09000000000003, "coord_origin": "TOPLEFT"}, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 139.371, "t": 216.06100000000004, "r": 480.595, "b": 270.289, "coord_origin": "TOPLEFT"}, "confidence": 0.967814564704895, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 227.35000000000002, "r_x1": 146.537, "r_y1": 227.35000000000002, "r_x2": 146.537, "r_y2": 216.06100000000004, "r_x3": 139.371, "r_y3": 216.06100000000004, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 227.35000000000002, "r_x1": 480.587, "r_y1": 227.35000000000002, "r_x2": 480.587, "r_y2": 216.06100000000004, "r_x3": 151.522, "r_y3": 216.06100000000004, "coord_origin": "TOPLEFT"}, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 238.30899999999997, "r_x1": 189.414, "r_y1": 238.30899999999997, "r_x2": 189.414, "r_y2": 227.01999999999998, "r_x3": 151.518, "r_y3": 227.01999999999998, "coord_origin": "TOPLEFT"}, "text": "A., Dolfi,", "orig": "A., Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.414, "r_y0": 238.30899999999997, "r_x1": 480.59, "r_y1": 238.30899999999997, "r_x2": 480.59, "r_y2": 227.01999999999998, "r_x3": 193.414, "r_y3": 227.01999999999998, "coord_origin": "TOPLEFT"}, "text": "M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 249.26800000000003, "r_x1": 480.595, "r_y1": 249.26800000000003, "r_x2": 480.595, "r_y2": 237.97900000000004, "r_x3": 151.518, "r_y3": 237.97900000000004, "coord_origin": "TOPLEFT"}, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 260.227, "r_x1": 197.086, "r_y1": 260.227, "r_x2": 197.086, "r_y2": 248.938, "r_x3": 151.518, "r_y3": 248.938, "coord_origin": "TOPLEFT"}, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.4, "r_y0": 259.07899999999995, "r_x1": 210.007, "r_y1": 259.07899999999995, "r_x2": 210.007, "r_y2": 251.15300000000002, "r_x3": 199.4, "r_y3": 251.15300000000002, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.007, "r_y0": 260.227, "r_x1": 332.377, "r_y1": 260.227, "r_x2": 332.377, "r_y2": 248.938, "r_x3": 210.007, "r_y3": 248.938, "coord_origin": "TOPLEFT"}, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.699, "r_y0": 259.331, "r_x1": 480.59, "r_y1": 259.331, "r_x2": 480.59, "r_y2": 251.86199999999997, "r_x3": 334.699, "r_y3": 251.86199999999997, "coord_origin": "TOPLEFT"}, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 270.289, "r_x1": 259.758, "r_y1": 270.289, "r_x2": 259.758, "r_y2": 262.82000000000005, "r_x3": 151.518, "r_y3": 262.82000000000005, "coord_origin": "TOPLEFT"}, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "list_item", "bbox": {"l": 139.371, "t": 270.86699999999996, "r": 480.594, "b": 304.074, "coord_origin": "TOPLEFT"}, "confidence": 0.9557179808616638, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 282.156, "r_x1": 146.537, "r_y1": 282.156, "r_x2": 146.537, "r_y2": 270.86699999999996, "r_x3": 139.371, "r_y3": 270.86699999999996, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 282.156, "r_x1": 480.588, "r_y1": 282.156, "r_x2": 480.588, "r_y2": 270.86699999999996, "r_x3": 151.522, "r_y3": 270.86699999999996, "coord_origin": "TOPLEFT"}, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 293.115, "r_x1": 480.594, "r_y1": 293.115, "r_x2": 480.594, "r_y2": 281.826, "r_x3": 151.518, "r_y3": 281.826, "coord_origin": "TOPLEFT"}, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 304.074, "r_x1": 473.443, "r_y1": 304.074, "r_x2": 473.443, "r_y2": 292.785, "r_x3": 151.518, "r_y3": 292.785, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 134.764, "t": 303.755, "r": 480.594, "b": 368.943, "coord_origin": "TOPLEFT"}, "confidence": 0.9639304876327515, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 315.044, "r_x1": 146.537, "r_y1": 315.044, "r_x2": 146.537, "r_y2": 303.755, "r_x3": 134.764, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 315.044, "r_x1": 195.667, "r_y1": 315.044, "r_x2": 195.667, "r_y2": 303.755, "r_x3": 151.522, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Pfitzmann,", "orig": "Pfitzmann,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.249, "r_y0": 315.044, "r_x1": 211.893, "r_y1": 315.044, "r_x2": 211.893, "r_y2": 303.755, "r_x3": 200.249, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "B.,", "orig": "B.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.484, "r_y0": 315.044, "r_x1": 238.772, "r_y1": 315.044, "r_x2": 238.772, "r_y2": 303.755, "r_x3": 216.484, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Auer,", "orig": "Auer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.362, "r_y0": 315.044, "r_x1": 255.134, "r_y1": 315.044, "r_x2": 255.134, "r_y2": 303.755, "r_x3": 243.362, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "C.,", "orig": "C.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.725, "r_y0": 315.044, "r_x1": 281.605, "r_y1": 315.044, "r_x2": 281.605, "r_y2": 303.755, "r_x3": 259.725, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Dolfi,", "orig": "Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.187, "r_y0": 315.044, "r_x1": 299.748, "r_y1": 315.044, "r_x2": 299.748, "r_y2": 303.755, "r_x3": 286.187, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "M.,", "orig": "M.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.339, "r_y0": 315.044, "r_x1": 333.893, "r_y1": 315.044, "r_x2": 333.893, "r_y2": 303.755, "r_x3": 304.339, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Nassar,", "orig": "Nassar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.483, "r_y0": 315.044, "r_x1": 358.187, "r_y1": 315.044, "r_x2": 358.187, "r_y2": 303.755, "r_x3": 338.483, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "A.S.,", "orig": "A.S.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.778, "r_y0": 315.044, "r_x1": 386.855, "r_y1": 315.044, "r_x2": 386.855, "r_y2": 303.755, "r_x3": 362.778, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Staar,", "orig": "Staar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.437, "r_y0": 315.044, "r_x1": 421.382, "r_y1": 315.044, "r_x2": 421.382, "r_y2": 303.755, "r_x3": 391.437, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "P.W.J.:", "orig": "P.W.J.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.973, "r_y0": 315.044, "r_x1": 469.09, "r_y1": 315.044, "r_x2": 469.09, "r_y2": 303.755, "r_x3": 425.973, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Doclaynet:", "orig": "Doclaynet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.68, "r_y0": 315.044, "r_x1": 480.589, "r_y1": 315.044, "r_x2": 480.589, "r_y2": 303.755, "r_x3": 473.68, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 326.003, "r_x1": 480.59, "r_y1": 326.003, "r_x2": 480.59, "r_y2": 314.714, "r_x3": 151.518, "r_y3": 314.714, "coord_origin": "TOPLEFT"}, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 336.962, "r_x1": 480.591, "r_y1": 336.962, "r_x2": 480.591, "r_y2": 325.673, "r_x3": 151.518, "r_y3": 325.673, "coord_origin": "TOPLEFT"}, "text": "Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 347.921, "r_x1": 480.591, "r_y1": 347.921, "r_x2": 480.591, "r_y2": 336.632, "r_x3": 151.518, "r_y3": 336.632, "coord_origin": "TOPLEFT"}, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 358.88, "r_x1": 251.141, "r_y1": 358.88, "r_x2": 251.141, "r_y2": 347.591, "r_x3": 151.518, "r_y3": 347.591, "coord_origin": "TOPLEFT"}, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.99, "r_y0": 357.984, "r_x1": 437.533, "r_y1": 357.984, "r_x2": 437.533, "r_y2": 350.515, "r_x3": 253.99, "r_y3": 350.515, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.532, "r_y0": 358.88, "r_x1": 440.091, "r_y1": 358.88, "r_x2": 440.091, "r_y2": 347.591, "r_x3": 437.532, "r_y3": 347.591, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.942, "r_y0": 357.984, "r_x1": 480.594, "r_y1": 357.984, "r_x2": 480.594, "r_y2": 350.515, "r_x3": 442.942, "r_y3": 350.515, "coord_origin": "TOPLEFT"}, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 368.943, "r_x1": 297.409, "r_y1": 368.943, "r_x2": 297.409, "r_y2": 361.474, "r_x3": 151.518, "r_y3": 361.474, "coord_origin": "TOPLEFT"}, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "list_item", "bbox": {"l": 134.764, "t": 369.52, "r": 480.593, "b": 413.686, "coord_origin": "TOPLEFT"}, "confidence": 0.9752162098884583, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 380.809, "r_x1": 146.537, "r_y1": 380.809, "r_x2": 146.537, "r_y2": 369.52, "r_x3": 134.764, "r_y3": 369.52, "coord_origin": "TOPLEFT"}, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 380.809, "r_x1": 480.589, "r_y1": 380.809, "r_x2": 480.589, "r_y2": 369.52, "r_x3": 151.522, "r_y3": 369.52, "coord_origin": "TOPLEFT"}, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 391.768, "r_x1": 480.593, "r_y1": 391.768, "r_x2": 480.593, "r_y2": 380.479, "r_x3": 151.518, "r_y3": 380.479, "coord_origin": "TOPLEFT"}, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 402.727, "r_x1": 480.593, "r_y1": 402.727, "r_x2": 480.593, "r_y2": 391.438, "r_x3": 151.518, "r_y3": 391.438, "coord_origin": "TOPLEFT"}, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 413.686, "r_x1": 373.827, "r_y1": 413.686, "r_x2": 373.827, "r_y2": 402.397, "r_x3": 151.518, "r_y3": 402.397, "coord_origin": "TOPLEFT"}, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 134.764, "t": 413.367, "r": 480.595, "b": 457.533, "coord_origin": "TOPLEFT"}, "confidence": 0.9707236886024475, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 424.656, "r_x1": 146.537, "r_y1": 424.656, "r_x2": 146.537, "r_y2": 413.367, "r_x3": 134.764, "r_y3": 413.367, "coord_origin": "TOPLEFT"}, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 424.656, "r_x1": 480.587, "r_y1": 424.656, "r_x2": 480.587, "r_y2": 413.367, "r_x3": 151.522, "r_y3": 413.367, "coord_origin": "TOPLEFT"}, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 435.615, "r_x1": 480.595, "r_y1": 435.615, "r_x2": 480.595, "r_y2": 424.326, "r_x3": 151.518, "r_y3": 424.326, "coord_origin": "TOPLEFT"}, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 446.574, "r_x1": 480.588, "r_y1": 446.574, "r_x2": 480.588, "r_y2": 435.285, "r_x3": 151.518, "r_y3": 435.285, "coord_origin": "TOPLEFT"}, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 457.533, "r_x1": 292.915, "r_y1": 457.533, "r_x2": 292.915, "r_y2": 446.244, "r_x3": 151.518, "r_y3": 446.244, "coord_origin": "TOPLEFT"}, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "list_item", "bbox": {"l": 134.764, "t": 457.214, "r": 480.594, "b": 500.484, "coord_origin": "TOPLEFT"}, "confidence": 0.9658119678497314, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 468.503, "r_x1": 146.537, "r_y1": 468.503, "r_x2": 146.537, "r_y2": 457.214, "r_x3": 134.764, "r_y3": 457.214, "coord_origin": "TOPLEFT"}, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 468.503, "r_x1": 480.59, "r_y1": 468.503, "r_x2": 480.59, "r_y2": 457.214, "r_x3": 151.522, "r_y3": 457.214, "coord_origin": "TOPLEFT"}, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 479.462, "r_x1": 480.591, "r_y1": 479.462, "r_x2": 480.591, "r_y2": 468.173, "r_x3": 151.518, "r_y3": 468.173, "coord_origin": "TOPLEFT"}, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 490.421, "r_x1": 439.06, "r_y1": 490.421, "r_x2": 439.06, "r_y2": 479.132, "r_x3": 151.518, "r_y3": 479.132, "coord_origin": "TOPLEFT"}, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.942, "r_y0": 489.525, "r_x1": 480.594, "r_y1": 489.525, "r_x2": 480.594, "r_y2": 482.056, "r_x3": 442.942, "r_y3": 482.056, "coord_origin": "TOPLEFT"}, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 500.484, "r_x1": 302.116, "r_y1": 500.484, "r_x2": 302.116, "r_y2": 493.015, "r_x3": 151.518, "r_y3": 493.015, "coord_origin": "TOPLEFT"}, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "list_item", "bbox": {"l": 134.764, "t": 501.061, "r": 480.593, "b": 545.227, "coord_origin": "TOPLEFT"}, "confidence": 0.972225546836853, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 512.35, "r_x1": 146.537, "r_y1": 512.35, "r_x2": 146.537, "r_y2": 501.061, "r_x3": 134.764, "r_y3": 501.061, "coord_origin": "TOPLEFT"}, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 512.35, "r_x1": 480.591, "r_y1": 512.35, "r_x2": 480.591, "r_y2": 501.061, "r_x3": 151.522, "r_y3": 501.061, "coord_origin": "TOPLEFT"}, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 523.309, "r_x1": 480.593, "r_y1": 523.309, "r_x2": 480.593, "r_y2": 512.02, "r_x3": 151.518, "r_y3": 512.02, "coord_origin": "TOPLEFT"}, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 534.268, "r_x1": 480.588, "r_y1": 534.268, "r_x2": 480.588, "r_y2": 522.979, "r_x3": 151.518, "r_y3": 522.979, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 545.227, "r_x1": 199.247, "r_y1": 545.227, "r_x2": 199.247, "r_y2": 533.938, "r_x3": 151.518, "r_y3": 533.938, "coord_origin": "TOPLEFT"}, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 134.764, "t": 544.908, "r": 480.596, "b": 610.096, "coord_origin": "TOPLEFT"}, "confidence": 0.9674034714698792, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 556.197, "r_x1": 146.537, "r_y1": 556.197, "r_x2": 146.537, "r_y2": 544.908, "r_x3": 134.764, "r_y3": 544.908, "coord_origin": "TOPLEFT"}, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 556.197, "r_x1": 480.587, "r_y1": 556.197, "r_x2": 480.587, "r_y2": 544.908, "r_x3": 151.522, "r_y3": 544.908, "coord_origin": "TOPLEFT"}, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 567.156, "r_x1": 480.588, "r_y1": 567.156, "r_x2": 480.588, "r_y2": 555.867, "r_x3": 151.518, "r_y3": 555.867, "coord_origin": "TOPLEFT"}, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 578.115, "r_x1": 480.591, "r_y1": 578.115, "r_x2": 480.591, "r_y2": 566.826, "r_x3": 151.518, "r_y3": 566.826, "coord_origin": "TOPLEFT"}, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 589.0740000000001, "r_x1": 480.592, "r_y1": 589.0740000000001, "r_x2": 480.592, "r_y2": 577.785, "r_x3": 151.518, "r_y3": 577.785, "coord_origin": "TOPLEFT"}, "text": "ing. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 600.033, "r_x1": 200.758, "r_y1": 600.033, "r_x2": 200.758, "r_y2": 588.744, "r_x3": 151.518, "r_y3": 588.744, "coord_origin": "TOPLEFT"}, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.916, "r_y0": 599.137, "r_x1": 386.459, "r_y1": 599.137, "r_x2": 386.459, "r_y2": 591.668, "r_x3": 202.916, "r_y3": 591.668, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.458, "r_y0": 600.033, "r_x1": 389.017, "r_y1": 600.033, "r_x2": 389.017, "r_y2": 588.744, "r_x3": 386.458, "r_y3": 588.744, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.173, "r_y0": 599.137, "r_x1": 480.596, "r_y1": 599.137, "r_x2": 480.596, "r_y2": 591.668, "r_x3": 391.173, "r_y3": 591.668, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 610.096, "r_x1": 245.638, "r_y1": 610.096, "r_x2": 245.638, "r_y2": 602.627, "r_x3": 151.518, "r_y3": 602.627, "coord_origin": "TOPLEFT"}, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "list_item", "bbox": {"l": 134.764, "t": 610.673, "r": 480.595, "b": 632.921, "coord_origin": "TOPLEFT"}, "confidence": 0.9416429996490479, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 621.962, "r_x1": 146.537, "r_y1": 621.962, "r_x2": 146.537, "r_y2": 610.673, "r_x3": 134.764, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 621.962, "r_x1": 194.229, "r_y1": 621.962, "r_x2": 194.229, "r_y2": 610.673, "r_x3": 151.522, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Wang, X.:", "orig": "Wang, X.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.313, "r_y0": 621.962, "r_x1": 230.817, "r_y1": 621.962, "r_x2": 230.817, "r_y2": 610.673, "r_x3": 199.313, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Tabular", "orig": "Tabular", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.91, "r_y0": 621.962, "r_x1": 285.885, "r_y1": 621.962, "r_x2": 285.885, "r_y2": 610.673, "r_x3": 235.91, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Abstraction,", "orig": "Abstraction,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 290.969, "r_y0": 621.962, "r_x1": 323.342, "r_y1": 621.962, "r_x2": 323.342, "r_y2": 610.673, "r_x3": 290.969, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Editing,", "orig": "Editing,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.435, "r_y0": 621.962, "r_x1": 343.278, "r_y1": 621.962, "r_x2": 343.278, "r_y2": 610.673, "r_x3": 328.435, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.371, "r_y0": 621.962, "r_x1": 396.118, "r_y1": 621.962, "r_x2": 396.118, "r_y2": 610.673, "r_x3": 348.371, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Formatting.", "orig": "Formatting.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.21, "r_y0": 621.962, "r_x1": 424.753, "r_y1": 621.962, "r_x2": 424.753, "r_y2": 610.673, "r_x3": 401.21, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Ph.D.", "orig": "Ph.D.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.846, "r_y0": 621.962, "r_x1": 455.031, "r_y1": 621.962, "r_x2": 455.031, "r_y2": 610.673, "r_x3": 429.846, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "thesis,", "orig": "thesis,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.124, "r_y0": 621.962, "r_x1": 480.595, "r_y1": 621.962, "r_x2": 480.595, "r_y2": 610.673, "r_x3": 460.124, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "CAN", "orig": "CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 632.921, "r_x1": 234.43, "r_y1": 632.921, "r_x2": 234.43, "r_y2": 621.6320000000001, "r_x3": 151.518, "r_y3": 621.6320000000001, "coord_origin": "TOPLEFT"}, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 134.764, "t": 632.602, "r": 480.591, "b": 665.809, "coord_origin": "TOPLEFT"}, "confidence": 0.9646382331848145, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 643.891, "r_x1": 146.537, "r_y1": 643.891, "r_x2": 146.537, "r_y2": 632.602, "r_x3": 134.764, "r_y3": 632.602, "coord_origin": "TOPLEFT"}, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 643.891, "r_x1": 480.587, "r_y1": 643.891, "r_x2": 480.587, "r_y2": 632.602, "r_x3": 151.522, "r_y3": 632.602, "coord_origin": "TOPLEFT"}, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 654.85, "r_x1": 480.591, "r_y1": 654.85, "r_x2": 480.591, "r_y2": 643.561, "r_x3": 151.518, "r_y3": 643.561, "coord_origin": "TOPLEFT"}, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 665.809, "r_x1": 299.303, "r_y1": 665.809, "r_x2": 299.303, "r_y2": 654.52, "r_x3": 151.518, "r_y3": 654.52, "coord_origin": "TOPLEFT"}, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 13, "page_no": 12, "cluster": {"id": 13, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9163166880607605, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 14, "page_no": 12, "cluster": {"id": 14, "label": "page_header", "bbox": {"l": 471.376, "t": 91.49300000000005, "r": 480.59, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9061064720153809, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.376, "r_y0": 102.78200000000004, "r_x1": 480.59, "r_y1": 102.78200000000004, "r_x2": 480.59, "r_y2": 91.49300000000005, "r_x3": 471.376, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "13"}, {"label": "list_item", "id": 5, "page_no": 12, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 139.371, "t": 117.39599999999996, "r": 480.595, "b": 150.60299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9677112698554993, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 128.68499999999995, "r_x1": 146.537, "r_y1": 128.68499999999995, "r_x2": 146.537, "r_y2": 117.39599999999996, "r_x3": 139.371, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 128.68499999999995, "r_x1": 480.588, "r_y1": 128.68499999999995, "r_x2": 480.588, "r_y2": 117.39599999999996, "r_x3": 151.522, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 139.644, "r_x1": 480.595, "r_y1": 139.644, "r_x2": 480.595, "r_y2": 128.35500000000002, "r_x3": 151.518, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 150.60299999999995, "r_x1": 304.044, "r_y1": 150.60299999999995, "r_x2": 304.044, "r_y2": 139.31399999999996, "r_x3": 151.518, "r_y3": 139.31399999999996, "coord_origin": "TOPLEFT"}, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content extraction from scientific tables. International Journal on Document Analysis and Recognition (IJDAR) pp. 1-10 (2022)"}, {"label": "list_item", "id": 1, "page_no": 12, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 139.371, "t": 150.284, "r": 480.593, "b": 194.45000000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.973045289516449, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 161.57299999999998, "r_x1": 146.537, "r_y1": 161.57299999999998, "r_x2": 146.537, "r_y2": 150.284, "r_x3": 139.371, "r_y3": 150.284, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 161.57299999999998, "r_x1": 480.59, "r_y1": 161.57299999999998, "r_x2": 480.59, "r_y2": 150.284, "r_x3": 151.522, "r_y3": 150.284, "coord_origin": "TOPLEFT"}, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 172.53200000000004, "r_x1": 480.59, "r_y1": 172.53200000000004, "r_x2": 480.59, "r_y2": 161.24300000000005, "r_x3": 151.518, "r_y3": 161.24300000000005, "coord_origin": "TOPLEFT"}, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 183.49099999999999, "r_x1": 480.593, "r_y1": 183.49099999999999, "r_x2": 480.593, "r_y2": 172.202, "r_x3": 151.518, "r_y3": 172.202, "coord_origin": "TOPLEFT"}, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 194.45000000000005, "r_x1": 226.374, "r_y1": 194.45000000000005, "r_x2": 226.374, "r_y2": 183.16099999999994, "r_x3": 151.518, "r_y3": 183.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC). pp. 18681873. IEEE (2022)"}, {"label": "list_item", "id": 10, "page_no": 12, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 139.371, "t": 194.13099999999997, "r": 480.59, "b": 216.37900000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9582491517066956, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 205.41999999999996, "r_x1": 146.537, "r_y1": 205.41999999999996, "r_x2": 146.537, "r_y2": 194.13099999999997, "r_x3": 139.371, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 205.41999999999996, "r_x1": 162.398, "r_y1": 205.41999999999996, "r_x2": 162.398, "r_y2": 194.13099999999997, "r_x3": 151.522, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "Li,", "orig": "Li,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.298, "r_y0": 205.41999999999996, "r_x1": 480.59, "r_y1": 205.41999999999996, "r_x2": 480.59, "r_y2": 194.13099999999997, "r_x3": 166.298, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 216.37900000000002, "r_x1": 352.017, "r_y1": 216.37900000000002, "r_x2": 352.017, "r_y2": 205.09000000000003, "r_x3": 151.518, "r_y3": 205.09000000000003, "coord_origin": "TOPLEFT"}, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7. Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark dataset for table detection and recognition (2019)"}, {"label": "list_item", "id": 4, "page_no": 12, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 139.371, "t": 216.06100000000004, "r": 480.595, "b": 270.289, "coord_origin": "TOPLEFT"}, "confidence": 0.967814564704895, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 227.35000000000002, "r_x1": 146.537, "r_y1": 227.35000000000002, "r_x2": 146.537, "r_y2": 216.06100000000004, "r_x3": 139.371, "r_y3": 216.06100000000004, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 227.35000000000002, "r_x1": 480.587, "r_y1": 227.35000000000002, "r_x2": 480.587, "r_y2": 216.06100000000004, "r_x3": 151.522, "r_y3": 216.06100000000004, "coord_origin": "TOPLEFT"}, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 238.30899999999997, "r_x1": 189.414, "r_y1": 238.30899999999997, "r_x2": 189.414, "r_y2": 227.01999999999998, "r_x3": 151.518, "r_y3": 227.01999999999998, "coord_origin": "TOPLEFT"}, "text": "A., Dolfi,", "orig": "A., Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.414, "r_y0": 238.30899999999997, "r_x1": 480.59, "r_y1": 238.30899999999997, "r_x2": 480.59, "r_y2": 227.01999999999998, "r_x3": 193.414, "r_y3": 227.01999999999998, "coord_origin": "TOPLEFT"}, "text": "M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 249.26800000000003, "r_x1": 480.595, "r_y1": 249.26800000000003, "r_x2": 480.595, "r_y2": 237.97900000000004, "r_x3": 151.518, "r_y3": 237.97900000000004, "coord_origin": "TOPLEFT"}, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 260.227, "r_x1": 197.086, "r_y1": 260.227, "r_x2": 197.086, "r_y2": 248.938, "r_x3": 151.518, "r_y3": 248.938, "coord_origin": "TOPLEFT"}, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.4, "r_y0": 259.07899999999995, "r_x1": 210.007, "r_y1": 259.07899999999995, "r_x2": 210.007, "r_y2": 251.15300000000002, "r_x3": 199.4, "r_y3": 251.15300000000002, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.007, "r_y0": 260.227, "r_x1": 332.377, "r_y1": 260.227, "r_x2": 332.377, "r_y2": 248.938, "r_x3": 210.007, "r_y3": 248.938, "coord_origin": "TOPLEFT"}, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.699, "r_y0": 259.331, "r_x1": 480.59, "r_y1": 259.331, "r_x2": 480.59, "r_y2": 251.86199999999997, "r_x3": 334.699, "r_y3": 251.86199999999997, "coord_origin": "TOPLEFT"}, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 270.289, "r_x1": 259.758, "r_y1": 270.289, "r_x2": 259.758, "r_y2": 262.82000000000005, "r_x3": 151.518, "r_y3": 262.82000000000005, "coord_origin": "TOPLEFT"}, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8. Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho, A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence 35 (17), 15137-15145 (May 2021), https://ojs.aaai.org/index.php/ AAAI/article/view/17777"}, {"label": "list_item", "id": 11, "page_no": 12, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 139.371, "t": 270.86699999999996, "r": 480.594, "b": 304.074, "coord_origin": "TOPLEFT"}, "confidence": 0.9557179808616638, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 282.156, "r_x1": 146.537, "r_y1": 282.156, "r_x2": 146.537, "r_y2": 270.86699999999996, "r_x3": 139.371, "r_y3": 270.86699999999996, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 282.156, "r_x1": 480.588, "r_y1": 282.156, "r_x2": 480.588, "r_y2": 270.86699999999996, "r_x3": 151.522, "r_y3": 270.86699999999996, "coord_origin": "TOPLEFT"}, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 293.115, "r_x1": 480.594, "r_y1": 293.115, "r_x2": 480.594, "r_y2": 281.826, "r_x3": 151.518, "r_y3": 281.826, "coord_origin": "TOPLEFT"}, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 304.074, "r_x1": 473.443, "r_y1": 304.074, "r_x2": 473.443, "r_y2": 292.785, "r_x3": 151.518, "r_y3": 292.785, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9. Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure understanding with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)"}, {"label": "list_item", "id": 9, "page_no": 12, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 134.764, "t": 303.755, "r": 480.594, "b": 368.943, "coord_origin": "TOPLEFT"}, "confidence": 0.9639304876327515, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 315.044, "r_x1": 146.537, "r_y1": 315.044, "r_x2": 146.537, "r_y2": 303.755, "r_x3": 134.764, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 315.044, "r_x1": 195.667, "r_y1": 315.044, "r_x2": 195.667, "r_y2": 303.755, "r_x3": 151.522, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Pfitzmann,", "orig": "Pfitzmann,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.249, "r_y0": 315.044, "r_x1": 211.893, "r_y1": 315.044, "r_x2": 211.893, "r_y2": 303.755, "r_x3": 200.249, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "B.,", "orig": "B.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.484, "r_y0": 315.044, "r_x1": 238.772, "r_y1": 315.044, "r_x2": 238.772, "r_y2": 303.755, "r_x3": 216.484, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Auer,", "orig": "Auer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.362, "r_y0": 315.044, "r_x1": 255.134, "r_y1": 315.044, "r_x2": 255.134, "r_y2": 303.755, "r_x3": 243.362, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "C.,", "orig": "C.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.725, "r_y0": 315.044, "r_x1": 281.605, "r_y1": 315.044, "r_x2": 281.605, "r_y2": 303.755, "r_x3": 259.725, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Dolfi,", "orig": "Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.187, "r_y0": 315.044, "r_x1": 299.748, "r_y1": 315.044, "r_x2": 299.748, "r_y2": 303.755, "r_x3": 286.187, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "M.,", "orig": "M.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.339, "r_y0": 315.044, "r_x1": 333.893, "r_y1": 315.044, "r_x2": 333.893, "r_y2": 303.755, "r_x3": 304.339, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Nassar,", "orig": "Nassar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.483, "r_y0": 315.044, "r_x1": 358.187, "r_y1": 315.044, "r_x2": 358.187, "r_y2": 303.755, "r_x3": 338.483, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "A.S.,", "orig": "A.S.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.778, "r_y0": 315.044, "r_x1": 386.855, "r_y1": 315.044, "r_x2": 386.855, "r_y2": 303.755, "r_x3": 362.778, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Staar,", "orig": "Staar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.437, "r_y0": 315.044, "r_x1": 421.382, "r_y1": 315.044, "r_x2": 421.382, "r_y2": 303.755, "r_x3": 391.437, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "P.W.J.:", "orig": "P.W.J.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.973, "r_y0": 315.044, "r_x1": 469.09, "r_y1": 315.044, "r_x2": 469.09, "r_y2": 303.755, "r_x3": 425.973, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Doclaynet:", "orig": "Doclaynet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.68, "r_y0": 315.044, "r_x1": 480.589, "r_y1": 315.044, "r_x2": 480.589, "r_y2": 303.755, "r_x3": 473.68, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 326.003, "r_x1": 480.59, "r_y1": 326.003, "r_x2": 480.59, "r_y2": 314.714, "r_x3": 151.518, "r_y3": 314.714, "coord_origin": "TOPLEFT"}, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 336.962, "r_x1": 480.591, "r_y1": 336.962, "r_x2": 480.591, "r_y2": 325.673, "r_x3": 151.518, "r_y3": 325.673, "coord_origin": "TOPLEFT"}, "text": "Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 347.921, "r_x1": 480.591, "r_y1": 347.921, "r_x2": 480.591, "r_y2": 336.632, "r_x3": 151.518, "r_y3": 336.632, "coord_origin": "TOPLEFT"}, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 358.88, "r_x1": 251.141, "r_y1": 358.88, "r_x2": 251.141, "r_y2": 347.591, "r_x3": 151.518, "r_y3": 347.591, "coord_origin": "TOPLEFT"}, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.99, "r_y0": 357.984, "r_x1": 437.533, "r_y1": 357.984, "r_x2": 437.533, "r_y2": 350.515, "r_x3": 253.99, "r_y3": 350.515, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.532, "r_y0": 358.88, "r_x1": 440.091, "r_y1": 358.88, "r_x2": 440.091, "r_y2": 347.591, "r_x3": 437.532, "r_y3": 347.591, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.942, "r_y0": 357.984, "r_x1": 480.594, "r_y1": 357.984, "r_x2": 480.594, "r_y2": 350.515, "r_x3": 442.942, "r_y3": 350.515, "coord_origin": "TOPLEFT"}, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 368.943, "r_x1": 297.409, "r_y1": 368.943, "r_x2": 297.409, "r_y2": 361.474, "r_x3": 151.518, "r_y3": 361.474, "coord_origin": "TOPLEFT"}, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "10. Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A large human-annotated dataset for document-layout segmentation. In: Zhang, A., Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp. 3743-3751. ACM (2022). https://doi.org/10.1145/3534678.3539043 , https:// doi.org/10.1145/3534678.3539043"}, {"label": "list_item", "id": 0, "page_no": 12, "cluster": {"id": 0, "label": "list_item", "bbox": {"l": 134.764, "t": 369.52, "r": 480.593, "b": 413.686, "coord_origin": "TOPLEFT"}, "confidence": 0.9752162098884583, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 380.809, "r_x1": 146.537, "r_y1": 380.809, "r_x2": 146.537, "r_y2": 369.52, "r_x3": 134.764, "r_y3": 369.52, "coord_origin": "TOPLEFT"}, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 380.809, "r_x1": 480.589, "r_y1": 380.809, "r_x2": 480.589, "r_y2": 369.52, "r_x3": 151.522, "r_y3": 369.52, "coord_origin": "TOPLEFT"}, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 391.768, "r_x1": 480.593, "r_y1": 391.768, "r_x2": 480.593, "r_y2": 380.479, "r_x3": 151.518, "r_y3": 380.479, "coord_origin": "TOPLEFT"}, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 402.727, "r_x1": 480.593, "r_y1": 402.727, "r_x2": 480.593, "r_y2": 391.438, "r_x3": 151.518, "r_y3": 391.438, "coord_origin": "TOPLEFT"}, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 413.686, "r_x1": 373.827, "r_y1": 413.686, "r_x2": 373.827, "r_y2": 402.397, "r_x3": 151.518, "r_y3": 402.397, "coord_origin": "TOPLEFT"}, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "11. Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet: An approach for end to end table detection and structure recognition from imagebased documents. In: Proceedings of the IEEE/CVF conference on computer vision and pattern recognition workshops. pp. 572-573 (2020)"}, {"label": "list_item", "id": 3, "page_no": 12, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 134.764, "t": 413.367, "r": 480.595, "b": 457.533, "coord_origin": "TOPLEFT"}, "confidence": 0.9707236886024475, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 424.656, "r_x1": 146.537, "r_y1": 424.656, "r_x2": 146.537, "r_y2": 413.367, "r_x3": 134.764, "r_y3": 413.367, "coord_origin": "TOPLEFT"}, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 424.656, "r_x1": 480.587, "r_y1": 424.656, "r_x2": 480.587, "r_y2": 413.367, "r_x3": 151.522, "r_y3": 413.367, "coord_origin": "TOPLEFT"}, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 435.615, "r_x1": 480.595, "r_y1": 435.615, "r_x2": 480.595, "r_y2": 424.326, "r_x3": 151.518, "r_y3": 424.326, "coord_origin": "TOPLEFT"}, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 446.574, "r_x1": 480.588, "r_y1": 446.574, "r_x2": 480.588, "r_y2": 435.285, "r_x3": 151.518, "r_y3": 435.285, "coord_origin": "TOPLEFT"}, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 457.533, "r_x1": 292.915, "r_y1": 457.533, "r_x2": 292.915, "r_y2": 446.244, "r_x3": 151.518, "r_y3": 446.244, "coord_origin": "TOPLEFT"}, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "12. Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR). vol. 1, pp. 1162-1167. IEEE (2017)"}, {"label": "list_item", "id": 7, "page_no": 12, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 134.764, "t": 457.214, "r": 480.594, "b": 500.484, "coord_origin": "TOPLEFT"}, "confidence": 0.9658119678497314, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 468.503, "r_x1": 146.537, "r_y1": 468.503, "r_x2": 146.537, "r_y2": 457.214, "r_x3": 134.764, "r_y3": 457.214, "coord_origin": "TOPLEFT"}, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 468.503, "r_x1": 480.59, "r_y1": 468.503, "r_x2": 480.59, "r_y2": 457.214, "r_x3": 151.522, "r_y3": 457.214, "coord_origin": "TOPLEFT"}, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 479.462, "r_x1": 480.591, "r_y1": 479.462, "r_x2": 480.591, "r_y2": 468.173, "r_x3": 151.518, "r_y3": 468.173, "coord_origin": "TOPLEFT"}, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 490.421, "r_x1": 439.06, "r_y1": 490.421, "r_x2": 439.06, "r_y2": 479.132, "r_x3": 151.518, "r_y3": 479.132, "coord_origin": "TOPLEFT"}, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.942, "r_y0": 489.525, "r_x1": 480.594, "r_y1": 489.525, "r_x2": 480.594, "r_y2": 482.056, "r_x3": 442.942, "r_y3": 482.056, "coord_origin": "TOPLEFT"}, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 500.484, "r_x1": 302.116, "r_y1": 500.484, "r_x2": 302.116, "r_y2": 493.015, "r_x3": 151.518, "r_y3": 493.015, "coord_origin": "TOPLEFT"}, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "13. Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep learning based table structure recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019). https:// doi.org/10.1109/ICDAR.2019.00226"}, {"label": "list_item", "id": 2, "page_no": 12, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 134.764, "t": 501.061, "r": 480.593, "b": 545.227, "coord_origin": "TOPLEFT"}, "confidence": 0.972225546836853, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 512.35, "r_x1": 146.537, "r_y1": 512.35, "r_x2": 146.537, "r_y2": 501.061, "r_x3": 134.764, "r_y3": 501.061, "coord_origin": "TOPLEFT"}, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 512.35, "r_x1": 480.591, "r_y1": 512.35, "r_x2": 480.591, "r_y2": 501.061, "r_x3": 151.522, "r_y3": 501.061, "coord_origin": "TOPLEFT"}, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 523.309, "r_x1": 480.593, "r_y1": 523.309, "r_x2": 480.593, "r_y2": 512.02, "r_x3": 151.518, "r_y3": 512.02, "coord_origin": "TOPLEFT"}, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 534.268, "r_x1": 480.588, "r_y1": 534.268, "r_x2": 480.588, "r_y2": 522.979, "r_x3": 151.518, "r_y3": 522.979, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 545.227, "r_x1": 199.247, "r_y1": 545.227, "r_x2": 199.247, "r_y2": 533.938, "r_x3": 151.518, "r_y3": 533.938, "coord_origin": "TOPLEFT"}, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "14. Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive table extraction from unstructured documents. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642 (June 2022)"}, {"label": "list_item", "id": 6, "page_no": 12, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 134.764, "t": 544.908, "r": 480.596, "b": 610.096, "coord_origin": "TOPLEFT"}, "confidence": 0.9674034714698792, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 556.197, "r_x1": 146.537, "r_y1": 556.197, "r_x2": 146.537, "r_y2": 544.908, "r_x3": 134.764, "r_y3": 544.908, "coord_origin": "TOPLEFT"}, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 556.197, "r_x1": 480.587, "r_y1": 556.197, "r_x2": 480.587, "r_y2": 544.908, "r_x3": 151.522, "r_y3": 544.908, "coord_origin": "TOPLEFT"}, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 567.156, "r_x1": 480.588, "r_y1": 567.156, "r_x2": 480.588, "r_y2": 555.867, "r_x3": 151.518, "r_y3": 555.867, "coord_origin": "TOPLEFT"}, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 578.115, "r_x1": 480.591, "r_y1": 578.115, "r_x2": 480.591, "r_y2": 566.826, "r_x3": 151.518, "r_y3": 566.826, "coord_origin": "TOPLEFT"}, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 589.0740000000001, "r_x1": 480.592, "r_y1": 589.0740000000001, "r_x2": 480.592, "r_y2": 577.785, "r_x3": 151.518, "r_y3": 577.785, "coord_origin": "TOPLEFT"}, "text": "ing. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 600.033, "r_x1": 200.758, "r_y1": 600.033, "r_x2": 200.758, "r_y2": 588.744, "r_x3": 151.518, "r_y3": 588.744, "coord_origin": "TOPLEFT"}, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.916, "r_y0": 599.137, "r_x1": 386.459, "r_y1": 599.137, "r_x2": 386.459, "r_y2": 591.668, "r_x3": 202.916, "r_y3": 591.668, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.458, "r_y0": 600.033, "r_x1": 389.017, "r_y1": 600.033, "r_x2": 389.017, "r_y2": 588.744, "r_x3": 386.458, "r_y3": 588.744, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.173, "r_y0": 599.137, "r_x1": 480.596, "r_y1": 599.137, "r_x2": 480.596, "r_y2": 591.668, "r_x3": 391.173, "r_y3": 591.668, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 610.096, "r_x1": 245.638, "r_y1": 610.096, "r_x2": 245.638, "r_y2": 602.627, "r_x3": 151.518, "r_y3": 602.627, "coord_origin": "TOPLEFT"}, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "15. Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A machine learning platform to ingest documents at scale. In: Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY, USA (2018). https://doi.org/10.1145/3219819.3219834 , https://doi.org/10. 1145/3219819.3219834"}, {"label": "list_item", "id": 12, "page_no": 12, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 134.764, "t": 610.673, "r": 480.595, "b": 632.921, "coord_origin": "TOPLEFT"}, "confidence": 0.9416429996490479, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 621.962, "r_x1": 146.537, "r_y1": 621.962, "r_x2": 146.537, "r_y2": 610.673, "r_x3": 134.764, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 621.962, "r_x1": 194.229, "r_y1": 621.962, "r_x2": 194.229, "r_y2": 610.673, "r_x3": 151.522, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Wang, X.:", "orig": "Wang, X.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.313, "r_y0": 621.962, "r_x1": 230.817, "r_y1": 621.962, "r_x2": 230.817, "r_y2": 610.673, "r_x3": 199.313, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Tabular", "orig": "Tabular", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.91, "r_y0": 621.962, "r_x1": 285.885, "r_y1": 621.962, "r_x2": 285.885, "r_y2": 610.673, "r_x3": 235.91, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Abstraction,", "orig": "Abstraction,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 290.969, "r_y0": 621.962, "r_x1": 323.342, "r_y1": 621.962, "r_x2": 323.342, "r_y2": 610.673, "r_x3": 290.969, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Editing,", "orig": "Editing,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.435, "r_y0": 621.962, "r_x1": 343.278, "r_y1": 621.962, "r_x2": 343.278, "r_y2": 610.673, "r_x3": 328.435, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.371, "r_y0": 621.962, "r_x1": 396.118, "r_y1": 621.962, "r_x2": 396.118, "r_y2": 610.673, "r_x3": 348.371, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Formatting.", "orig": "Formatting.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.21, "r_y0": 621.962, "r_x1": 424.753, "r_y1": 621.962, "r_x2": 424.753, "r_y2": 610.673, "r_x3": 401.21, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Ph.D.", "orig": "Ph.D.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.846, "r_y0": 621.962, "r_x1": 455.031, "r_y1": 621.962, "r_x2": 455.031, "r_y2": 610.673, "r_x3": 429.846, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "thesis,", "orig": "thesis,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.124, "r_y0": 621.962, "r_x1": 480.595, "r_y1": 621.962, "r_x2": 480.595, "r_y2": 610.673, "r_x3": 460.124, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "CAN", "orig": "CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 632.921, "r_x1": 234.43, "r_y1": 632.921, "r_x2": 234.43, "r_y2": 621.6320000000001, "r_x3": 151.518, "r_y3": 621.6320000000001, "coord_origin": "TOPLEFT"}, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "16. Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN (1996), aAINN09397"}, {"label": "list_item", "id": 8, "page_no": 12, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 134.764, "t": 632.602, "r": 480.591, "b": 665.809, "coord_origin": "TOPLEFT"}, "confidence": 0.9646382331848145, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 643.891, "r_x1": 146.537, "r_y1": 643.891, "r_x2": 146.537, "r_y2": 632.602, "r_x3": 134.764, "r_y3": 632.602, "coord_origin": "TOPLEFT"}, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 643.891, "r_x1": 480.587, "r_y1": 643.891, "r_x2": 480.587, "r_y2": 632.602, "r_x3": 151.522, "r_y3": 632.602, "coord_origin": "TOPLEFT"}, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 654.85, "r_x1": 480.591, "r_y1": 654.85, "r_x2": 480.591, "r_y2": 643.561, "r_x3": 151.518, "r_y3": 643.561, "coord_origin": "TOPLEFT"}, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 665.809, "r_x1": 299.303, "r_y1": 665.809, "r_x2": 299.303, "r_y2": 654.52, "r_x3": 151.518, "r_y3": 654.52, "coord_origin": "TOPLEFT"}, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "17. Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table images. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 749-755. IEEE (2019)"}], "body": [{"label": "list_item", "id": 5, "page_no": 12, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 139.371, "t": 117.39599999999996, "r": 480.595, "b": 150.60299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9677112698554993, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 128.68499999999995, "r_x1": 146.537, "r_y1": 128.68499999999995, "r_x2": 146.537, "r_y2": 117.39599999999996, "r_x3": 139.371, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 128.68499999999995, "r_x1": 480.588, "r_y1": 128.68499999999995, "r_x2": 480.588, "r_y2": 117.39599999999996, "r_x3": 151.522, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 139.644, "r_x1": 480.595, "r_y1": 139.644, "r_x2": 480.595, "r_y2": 128.35500000000002, "r_x3": 151.518, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 150.60299999999995, "r_x1": 304.044, "r_y1": 150.60299999999995, "r_x2": 304.044, "r_y2": 139.31399999999996, "r_x3": 151.518, "r_y3": 139.31399999999996, "coord_origin": "TOPLEFT"}, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content extraction from scientific tables. International Journal on Document Analysis and Recognition (IJDAR) pp. 1-10 (2022)"}, {"label": "list_item", "id": 1, "page_no": 12, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 139.371, "t": 150.284, "r": 480.593, "b": 194.45000000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.973045289516449, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 161.57299999999998, "r_x1": 146.537, "r_y1": 161.57299999999998, "r_x2": 146.537, "r_y2": 150.284, "r_x3": 139.371, "r_y3": 150.284, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 161.57299999999998, "r_x1": 480.59, "r_y1": 161.57299999999998, "r_x2": 480.59, "r_y2": 150.284, "r_x3": 151.522, "r_y3": 150.284, "coord_origin": "TOPLEFT"}, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 172.53200000000004, "r_x1": 480.59, "r_y1": 172.53200000000004, "r_x2": 480.59, "r_y2": 161.24300000000005, "r_x3": 151.518, "r_y3": 161.24300000000005, "coord_origin": "TOPLEFT"}, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 183.49099999999999, "r_x1": 480.593, "r_y1": 183.49099999999999, "r_x2": 480.593, "r_y2": 172.202, "r_x3": 151.518, "r_y3": 172.202, "coord_origin": "TOPLEFT"}, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 194.45000000000005, "r_x1": 226.374, "r_y1": 194.45000000000005, "r_x2": 226.374, "r_y2": 183.16099999999994, "r_x3": 151.518, "r_y3": 183.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC). pp. 18681873. IEEE (2022)"}, {"label": "list_item", "id": 10, "page_no": 12, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 139.371, "t": 194.13099999999997, "r": 480.59, "b": 216.37900000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9582491517066956, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 205.41999999999996, "r_x1": 146.537, "r_y1": 205.41999999999996, "r_x2": 146.537, "r_y2": 194.13099999999997, "r_x3": 139.371, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 205.41999999999996, "r_x1": 162.398, "r_y1": 205.41999999999996, "r_x2": 162.398, "r_y2": 194.13099999999997, "r_x3": 151.522, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "Li,", "orig": "Li,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.298, "r_y0": 205.41999999999996, "r_x1": 480.59, "r_y1": 205.41999999999996, "r_x2": 480.59, "r_y2": 194.13099999999997, "r_x3": 166.298, "r_y3": 194.13099999999997, "coord_origin": "TOPLEFT"}, "text": "M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 216.37900000000002, "r_x1": 352.017, "r_y1": 216.37900000000002, "r_x2": 352.017, "r_y2": 205.09000000000003, "r_x3": 151.518, "r_y3": 205.09000000000003, "coord_origin": "TOPLEFT"}, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7. Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark dataset for table detection and recognition (2019)"}, {"label": "list_item", "id": 4, "page_no": 12, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 139.371, "t": 216.06100000000004, "r": 480.595, "b": 270.289, "coord_origin": "TOPLEFT"}, "confidence": 0.967814564704895, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 227.35000000000002, "r_x1": 146.537, "r_y1": 227.35000000000002, "r_x2": 146.537, "r_y2": 216.06100000000004, "r_x3": 139.371, "r_y3": 216.06100000000004, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 227.35000000000002, "r_x1": 480.587, "r_y1": 227.35000000000002, "r_x2": 480.587, "r_y2": 216.06100000000004, "r_x3": 151.522, "r_y3": 216.06100000000004, "coord_origin": "TOPLEFT"}, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 238.30899999999997, "r_x1": 189.414, "r_y1": 238.30899999999997, "r_x2": 189.414, "r_y2": 227.01999999999998, "r_x3": 151.518, "r_y3": 227.01999999999998, "coord_origin": "TOPLEFT"}, "text": "A., Dolfi,", "orig": "A., Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.414, "r_y0": 238.30899999999997, "r_x1": 480.59, "r_y1": 238.30899999999997, "r_x2": 480.59, "r_y2": 227.01999999999998, "r_x3": 193.414, "r_y3": 227.01999999999998, "coord_origin": "TOPLEFT"}, "text": "M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 249.26800000000003, "r_x1": 480.595, "r_y1": 249.26800000000003, "r_x2": 480.595, "r_y2": 237.97900000000004, "r_x3": 151.518, "r_y3": 237.97900000000004, "coord_origin": "TOPLEFT"}, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 260.227, "r_x1": 197.086, "r_y1": 260.227, "r_x2": 197.086, "r_y2": 248.938, "r_x3": 151.518, "r_y3": 248.938, "coord_origin": "TOPLEFT"}, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.4, "r_y0": 259.07899999999995, "r_x1": 210.007, "r_y1": 259.07899999999995, "r_x2": 210.007, "r_y2": 251.15300000000002, "r_x3": 199.4, "r_y3": 251.15300000000002, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.007, "r_y0": 260.227, "r_x1": 332.377, "r_y1": 260.227, "r_x2": 332.377, "r_y2": 248.938, "r_x3": 210.007, "r_y3": 248.938, "coord_origin": "TOPLEFT"}, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.699, "r_y0": 259.331, "r_x1": 480.59, "r_y1": 259.331, "r_x2": 480.59, "r_y2": 251.86199999999997, "r_x3": 334.699, "r_y3": 251.86199999999997, "coord_origin": "TOPLEFT"}, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 270.289, "r_x1": 259.758, "r_y1": 270.289, "r_x2": 259.758, "r_y2": 262.82000000000005, "r_x3": 151.518, "r_y3": 262.82000000000005, "coord_origin": "TOPLEFT"}, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8. Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho, A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence 35 (17), 15137-15145 (May 2021), https://ojs.aaai.org/index.php/ AAAI/article/view/17777"}, {"label": "list_item", "id": 11, "page_no": 12, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 139.371, "t": 270.86699999999996, "r": 480.594, "b": 304.074, "coord_origin": "TOPLEFT"}, "confidence": 0.9557179808616638, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.371, "r_y0": 282.156, "r_x1": 146.537, "r_y1": 282.156, "r_x2": 146.537, "r_y2": 270.86699999999996, "r_x3": 139.371, "r_y3": 270.86699999999996, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 282.156, "r_x1": 480.588, "r_y1": 282.156, "r_x2": 480.588, "r_y2": 270.86699999999996, "r_x3": 151.522, "r_y3": 270.86699999999996, "coord_origin": "TOPLEFT"}, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 293.115, "r_x1": 480.594, "r_y1": 293.115, "r_x2": 480.594, "r_y2": 281.826, "r_x3": 151.518, "r_y3": 281.826, "coord_origin": "TOPLEFT"}, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 304.074, "r_x1": 473.443, "r_y1": 304.074, "r_x2": 473.443, "r_y2": 292.785, "r_x3": 151.518, "r_y3": 292.785, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9. Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure understanding with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)"}, {"label": "list_item", "id": 9, "page_no": 12, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 134.764, "t": 303.755, "r": 480.594, "b": 368.943, "coord_origin": "TOPLEFT"}, "confidence": 0.9639304876327515, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 315.044, "r_x1": 146.537, "r_y1": 315.044, "r_x2": 146.537, "r_y2": 303.755, "r_x3": 134.764, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 315.044, "r_x1": 195.667, "r_y1": 315.044, "r_x2": 195.667, "r_y2": 303.755, "r_x3": 151.522, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Pfitzmann,", "orig": "Pfitzmann,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.249, "r_y0": 315.044, "r_x1": 211.893, "r_y1": 315.044, "r_x2": 211.893, "r_y2": 303.755, "r_x3": 200.249, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "B.,", "orig": "B.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.484, "r_y0": 315.044, "r_x1": 238.772, "r_y1": 315.044, "r_x2": 238.772, "r_y2": 303.755, "r_x3": 216.484, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Auer,", "orig": "Auer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.362, "r_y0": 315.044, "r_x1": 255.134, "r_y1": 315.044, "r_x2": 255.134, "r_y2": 303.755, "r_x3": 243.362, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "C.,", "orig": "C.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.725, "r_y0": 315.044, "r_x1": 281.605, "r_y1": 315.044, "r_x2": 281.605, "r_y2": 303.755, "r_x3": 259.725, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Dolfi,", "orig": "Dolfi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 286.187, "r_y0": 315.044, "r_x1": 299.748, "r_y1": 315.044, "r_x2": 299.748, "r_y2": 303.755, "r_x3": 286.187, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "M.,", "orig": "M.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.339, "r_y0": 315.044, "r_x1": 333.893, "r_y1": 315.044, "r_x2": 333.893, "r_y2": 303.755, "r_x3": 304.339, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Nassar,", "orig": "Nassar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.483, "r_y0": 315.044, "r_x1": 358.187, "r_y1": 315.044, "r_x2": 358.187, "r_y2": 303.755, "r_x3": 338.483, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "A.S.,", "orig": "A.S.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.778, "r_y0": 315.044, "r_x1": 386.855, "r_y1": 315.044, "r_x2": 386.855, "r_y2": 303.755, "r_x3": 362.778, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Staar,", "orig": "Staar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.437, "r_y0": 315.044, "r_x1": 421.382, "r_y1": 315.044, "r_x2": 421.382, "r_y2": 303.755, "r_x3": 391.437, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "P.W.J.:", "orig": "P.W.J.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.973, "r_y0": 315.044, "r_x1": 469.09, "r_y1": 315.044, "r_x2": 469.09, "r_y2": 303.755, "r_x3": 425.973, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "Doclaynet:", "orig": "Doclaynet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.68, "r_y0": 315.044, "r_x1": 480.589, "r_y1": 315.044, "r_x2": 480.589, "r_y2": 303.755, "r_x3": 473.68, "r_y3": 303.755, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 326.003, "r_x1": 480.59, "r_y1": 326.003, "r_x2": 480.59, "r_y2": 314.714, "r_x3": 151.518, "r_y3": 314.714, "coord_origin": "TOPLEFT"}, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 336.962, "r_x1": 480.591, "r_y1": 336.962, "r_x2": 480.591, "r_y2": 325.673, "r_x3": 151.518, "r_y3": 325.673, "coord_origin": "TOPLEFT"}, "text": "Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 347.921, "r_x1": 480.591, "r_y1": 347.921, "r_x2": 480.591, "r_y2": 336.632, "r_x3": 151.518, "r_y3": 336.632, "coord_origin": "TOPLEFT"}, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 358.88, "r_x1": 251.141, "r_y1": 358.88, "r_x2": 251.141, "r_y2": 347.591, "r_x3": 151.518, "r_y3": 347.591, "coord_origin": "TOPLEFT"}, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.99, "r_y0": 357.984, "r_x1": 437.533, "r_y1": 357.984, "r_x2": 437.533, "r_y2": 350.515, "r_x3": 253.99, "r_y3": 350.515, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.532, "r_y0": 358.88, "r_x1": 440.091, "r_y1": 358.88, "r_x2": 440.091, "r_y2": 347.591, "r_x3": 437.532, "r_y3": 347.591, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.942, "r_y0": 357.984, "r_x1": 480.594, "r_y1": 357.984, "r_x2": 480.594, "r_y2": 350.515, "r_x3": 442.942, "r_y3": 350.515, "coord_origin": "TOPLEFT"}, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 368.943, "r_x1": 297.409, "r_y1": 368.943, "r_x2": 297.409, "r_y2": 361.474, "r_x3": 151.518, "r_y3": 361.474, "coord_origin": "TOPLEFT"}, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "10. Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A large human-annotated dataset for document-layout segmentation. In: Zhang, A., Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp. 3743-3751. ACM (2022). https://doi.org/10.1145/3534678.3539043 , https:// doi.org/10.1145/3534678.3539043"}, {"label": "list_item", "id": 0, "page_no": 12, "cluster": {"id": 0, "label": "list_item", "bbox": {"l": 134.764, "t": 369.52, "r": 480.593, "b": 413.686, "coord_origin": "TOPLEFT"}, "confidence": 0.9752162098884583, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 380.809, "r_x1": 146.537, "r_y1": 380.809, "r_x2": 146.537, "r_y2": 369.52, "r_x3": 134.764, "r_y3": 369.52, "coord_origin": "TOPLEFT"}, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 380.809, "r_x1": 480.589, "r_y1": 380.809, "r_x2": 480.589, "r_y2": 369.52, "r_x3": 151.522, "r_y3": 369.52, "coord_origin": "TOPLEFT"}, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 391.768, "r_x1": 480.593, "r_y1": 391.768, "r_x2": 480.593, "r_y2": 380.479, "r_x3": 151.518, "r_y3": 380.479, "coord_origin": "TOPLEFT"}, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 402.727, "r_x1": 480.593, "r_y1": 402.727, "r_x2": 480.593, "r_y2": 391.438, "r_x3": 151.518, "r_y3": 391.438, "coord_origin": "TOPLEFT"}, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 413.686, "r_x1": 373.827, "r_y1": 413.686, "r_x2": 373.827, "r_y2": 402.397, "r_x3": 151.518, "r_y3": 402.397, "coord_origin": "TOPLEFT"}, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "11. Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet: An approach for end to end table detection and structure recognition from imagebased documents. In: Proceedings of the IEEE/CVF conference on computer vision and pattern recognition workshops. pp. 572-573 (2020)"}, {"label": "list_item", "id": 3, "page_no": 12, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 134.764, "t": 413.367, "r": 480.595, "b": 457.533, "coord_origin": "TOPLEFT"}, "confidence": 0.9707236886024475, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 424.656, "r_x1": 146.537, "r_y1": 424.656, "r_x2": 146.537, "r_y2": 413.367, "r_x3": 134.764, "r_y3": 413.367, "coord_origin": "TOPLEFT"}, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 424.656, "r_x1": 480.587, "r_y1": 424.656, "r_x2": 480.587, "r_y2": 413.367, "r_x3": 151.522, "r_y3": 413.367, "coord_origin": "TOPLEFT"}, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 435.615, "r_x1": 480.595, "r_y1": 435.615, "r_x2": 480.595, "r_y2": 424.326, "r_x3": 151.518, "r_y3": 424.326, "coord_origin": "TOPLEFT"}, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 446.574, "r_x1": 480.588, "r_y1": 446.574, "r_x2": 480.588, "r_y2": 435.285, "r_x3": 151.518, "r_y3": 435.285, "coord_origin": "TOPLEFT"}, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 457.533, "r_x1": 292.915, "r_y1": 457.533, "r_x2": 292.915, "r_y2": 446.244, "r_x3": 151.518, "r_y3": 446.244, "coord_origin": "TOPLEFT"}, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "12. Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR). vol. 1, pp. 1162-1167. IEEE (2017)"}, {"label": "list_item", "id": 7, "page_no": 12, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 134.764, "t": 457.214, "r": 480.594, "b": 500.484, "coord_origin": "TOPLEFT"}, "confidence": 0.9658119678497314, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 468.503, "r_x1": 146.537, "r_y1": 468.503, "r_x2": 146.537, "r_y2": 457.214, "r_x3": 134.764, "r_y3": 457.214, "coord_origin": "TOPLEFT"}, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 468.503, "r_x1": 480.59, "r_y1": 468.503, "r_x2": 480.59, "r_y2": 457.214, "r_x3": 151.522, "r_y3": 457.214, "coord_origin": "TOPLEFT"}, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 479.462, "r_x1": 480.591, "r_y1": 479.462, "r_x2": 480.591, "r_y2": 468.173, "r_x3": 151.518, "r_y3": 468.173, "coord_origin": "TOPLEFT"}, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 490.421, "r_x1": 439.06, "r_y1": 490.421, "r_x2": 439.06, "r_y2": 479.132, "r_x3": 151.518, "r_y3": 479.132, "coord_origin": "TOPLEFT"}, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.942, "r_y0": 489.525, "r_x1": 480.594, "r_y1": 489.525, "r_x2": 480.594, "r_y2": 482.056, "r_x3": 442.942, "r_y3": 482.056, "coord_origin": "TOPLEFT"}, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 500.484, "r_x1": 302.116, "r_y1": 500.484, "r_x2": 302.116, "r_y2": 493.015, "r_x3": 151.518, "r_y3": 493.015, "coord_origin": "TOPLEFT"}, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "13. Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep learning based table structure recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019). https:// doi.org/10.1109/ICDAR.2019.00226"}, {"label": "list_item", "id": 2, "page_no": 12, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 134.764, "t": 501.061, "r": 480.593, "b": 545.227, "coord_origin": "TOPLEFT"}, "confidence": 0.972225546836853, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 512.35, "r_x1": 146.537, "r_y1": 512.35, "r_x2": 146.537, "r_y2": 501.061, "r_x3": 134.764, "r_y3": 501.061, "coord_origin": "TOPLEFT"}, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 512.35, "r_x1": 480.591, "r_y1": 512.35, "r_x2": 480.591, "r_y2": 501.061, "r_x3": 151.522, "r_y3": 501.061, "coord_origin": "TOPLEFT"}, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 523.309, "r_x1": 480.593, "r_y1": 523.309, "r_x2": 480.593, "r_y2": 512.02, "r_x3": 151.518, "r_y3": 512.02, "coord_origin": "TOPLEFT"}, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 534.268, "r_x1": 480.588, "r_y1": 534.268, "r_x2": 480.588, "r_y2": 522.979, "r_x3": 151.518, "r_y3": 522.979, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 545.227, "r_x1": 199.247, "r_y1": 545.227, "r_x2": 199.247, "r_y2": 533.938, "r_x3": 151.518, "r_y3": 533.938, "coord_origin": "TOPLEFT"}, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "14. Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive table extraction from unstructured documents. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642 (June 2022)"}, {"label": "list_item", "id": 6, "page_no": 12, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 134.764, "t": 544.908, "r": 480.596, "b": 610.096, "coord_origin": "TOPLEFT"}, "confidence": 0.9674034714698792, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 556.197, "r_x1": 146.537, "r_y1": 556.197, "r_x2": 146.537, "r_y2": 544.908, "r_x3": 134.764, "r_y3": 544.908, "coord_origin": "TOPLEFT"}, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 556.197, "r_x1": 480.587, "r_y1": 556.197, "r_x2": 480.587, "r_y2": 544.908, "r_x3": 151.522, "r_y3": 544.908, "coord_origin": "TOPLEFT"}, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 567.156, "r_x1": 480.588, "r_y1": 567.156, "r_x2": 480.588, "r_y2": 555.867, "r_x3": 151.518, "r_y3": 555.867, "coord_origin": "TOPLEFT"}, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 578.115, "r_x1": 480.591, "r_y1": 578.115, "r_x2": 480.591, "r_y2": 566.826, "r_x3": 151.518, "r_y3": 566.826, "coord_origin": "TOPLEFT"}, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 589.0740000000001, "r_x1": 480.592, "r_y1": 589.0740000000001, "r_x2": 480.592, "r_y2": 577.785, "r_x3": 151.518, "r_y3": 577.785, "coord_origin": "TOPLEFT"}, "text": "ing. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 600.033, "r_x1": 200.758, "r_y1": 600.033, "r_x2": 200.758, "r_y2": 588.744, "r_x3": 151.518, "r_y3": 588.744, "coord_origin": "TOPLEFT"}, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.916, "r_y0": 599.137, "r_x1": 386.459, "r_y1": 599.137, "r_x2": 386.459, "r_y2": 591.668, "r_x3": 202.916, "r_y3": 591.668, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.458, "r_y0": 600.033, "r_x1": 389.017, "r_y1": 600.033, "r_x2": 389.017, "r_y2": 588.744, "r_x3": 386.458, "r_y3": 588.744, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.173, "r_y0": 599.137, "r_x1": 480.596, "r_y1": 599.137, "r_x2": 480.596, "r_y2": 591.668, "r_x3": 391.173, "r_y3": 591.668, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 610.096, "r_x1": 245.638, "r_y1": 610.096, "r_x2": 245.638, "r_y2": 602.627, "r_x3": 151.518, "r_y3": 602.627, "coord_origin": "TOPLEFT"}, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "15. Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A machine learning platform to ingest documents at scale. In: Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY, USA (2018). https://doi.org/10.1145/3219819.3219834 , https://doi.org/10. 1145/3219819.3219834"}, {"label": "list_item", "id": 12, "page_no": 12, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 134.764, "t": 610.673, "r": 480.595, "b": 632.921, "coord_origin": "TOPLEFT"}, "confidence": 0.9416429996490479, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 621.962, "r_x1": 146.537, "r_y1": 621.962, "r_x2": 146.537, "r_y2": 610.673, "r_x3": 134.764, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 621.962, "r_x1": 194.229, "r_y1": 621.962, "r_x2": 194.229, "r_y2": 610.673, "r_x3": 151.522, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Wang, X.:", "orig": "Wang, X.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.313, "r_y0": 621.962, "r_x1": 230.817, "r_y1": 621.962, "r_x2": 230.817, "r_y2": 610.673, "r_x3": 199.313, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Tabular", "orig": "Tabular", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.91, "r_y0": 621.962, "r_x1": 285.885, "r_y1": 621.962, "r_x2": 285.885, "r_y2": 610.673, "r_x3": 235.91, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Abstraction,", "orig": "Abstraction,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 290.969, "r_y0": 621.962, "r_x1": 323.342, "r_y1": 621.962, "r_x2": 323.342, "r_y2": 610.673, "r_x3": 290.969, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Editing,", "orig": "Editing,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.435, "r_y0": 621.962, "r_x1": 343.278, "r_y1": 621.962, "r_x2": 343.278, "r_y2": 610.673, "r_x3": 328.435, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.371, "r_y0": 621.962, "r_x1": 396.118, "r_y1": 621.962, "r_x2": 396.118, "r_y2": 610.673, "r_x3": 348.371, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Formatting.", "orig": "Formatting.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.21, "r_y0": 621.962, "r_x1": 424.753, "r_y1": 621.962, "r_x2": 424.753, "r_y2": 610.673, "r_x3": 401.21, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "Ph.D.", "orig": "Ph.D.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.846, "r_y0": 621.962, "r_x1": 455.031, "r_y1": 621.962, "r_x2": 455.031, "r_y2": 610.673, "r_x3": 429.846, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "thesis,", "orig": "thesis,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.124, "r_y0": 621.962, "r_x1": 480.595, "r_y1": 621.962, "r_x2": 480.595, "r_y2": 610.673, "r_x3": 460.124, "r_y3": 610.673, "coord_origin": "TOPLEFT"}, "text": "CAN", "orig": "CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 632.921, "r_x1": 234.43, "r_y1": 632.921, "r_x2": 234.43, "r_y2": 621.6320000000001, "r_x3": 151.518, "r_y3": 621.6320000000001, "coord_origin": "TOPLEFT"}, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "16. Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN (1996), aAINN09397"}, {"label": "list_item", "id": 8, "page_no": 12, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 134.764, "t": 632.602, "r": 480.591, "b": 665.809, "coord_origin": "TOPLEFT"}, "confidence": 0.9646382331848145, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.764, "r_y0": 643.891, "r_x1": 146.537, "r_y1": 643.891, "r_x2": 146.537, "r_y2": 632.602, "r_x3": 134.764, "r_y3": 632.602, "coord_origin": "TOPLEFT"}, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.522, "r_y0": 643.891, "r_x1": 480.587, "r_y1": 643.891, "r_x2": 480.587, "r_y2": 632.602, "r_x3": 151.522, "r_y3": 632.602, "coord_origin": "TOPLEFT"}, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 654.85, "r_x1": 480.591, "r_y1": 654.85, "r_x2": 480.591, "r_y2": 643.561, "r_x3": 151.518, "r_y3": 643.561, "coord_origin": "TOPLEFT"}, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 665.809, "r_x1": 299.303, "r_y1": 665.809, "r_x2": 299.303, "r_y2": 654.52, "r_x3": 151.518, "r_y3": 654.52, "coord_origin": "TOPLEFT"}, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "17. Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table images. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 749-755. IEEE (2019)"}], "headers": [{"label": "page_header", "id": 13, "page_no": 12, "cluster": {"id": 13, "label": "page_header", "bbox": {"l": 194.478, "t": 91.49300000000005, "r": 447.543, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9163166880607605, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.478, "r_y0": 102.78200000000004, "r_x1": 447.543, "r_y1": 102.78200000000004, "r_x2": 447.543, "r_y2": 91.49300000000005, "r_x3": 194.478, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Optimized Table Tokenization for Table Structure Recognition"}, {"label": "page_header", "id": 14, "page_no": 12, "cluster": {"id": 14, "label": "page_header", "bbox": {"l": 471.376, "t": 91.49300000000005, "r": 480.59, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9061064720153809, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.376, "r_y0": 102.78200000000004, "r_x1": 480.59, "r_y1": 102.78200000000004, "r_x2": 480.59, "r_y2": 91.49300000000005, "r_x3": 471.376, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "13"}]}}, {"page_no": 13, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.68499999999995, "r_x1": 146.538, "r_y1": 128.68499999999995, "r_x2": 146.538, "r_y2": 117.39599999999996, "r_x3": 134.765, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 128.68499999999995, "r_x1": 480.589, "r_y1": 128.68499999999995, "r_x2": 480.589, "r_y2": 117.39599999999996, "r_x3": 151.514, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 139.644, "r_x1": 167.385, "r_y1": 139.644, "r_x2": 167.385, "r_y2": 128.35500000000002, "r_x3": 151.518, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "tion", "orig": "tion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.492, "r_y0": 139.644, "r_x1": 334.467, "r_y1": 139.644, "r_x2": 334.467, "r_y2": 128.35500000000002, "r_x3": 171.492, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.573, "r_y0": 139.644, "r_x1": 349.576, "r_y1": 139.644, "r_x2": 349.576, "r_y2": 128.35500000000002, "r_x3": 338.573, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "In:", "orig": "In:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.674, "r_y0": 139.644, "r_x1": 480.591, "r_y1": 139.644, "r_x2": 480.591, "r_y2": 128.35500000000002, "r_x3": 353.674, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 150.60299999999995, "r_x1": 427.533, "r_y1": 150.60299999999995, "r_x2": 427.533, "r_y2": 139.31399999999996, "r_x3": 151.518, "r_y3": 139.31399999999996, "coord_origin": "TOPLEFT"}, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 161.562, "r_x1": 146.538, "r_y1": 161.562, "r_x2": 146.538, "r_y2": 150.27300000000002, "r_x3": 134.765, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 161.562, "r_x1": 164.318, "r_y1": 161.562, "r_x2": 164.318, "r_y2": 150.27300000000002, "r_x3": 151.514, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Ye,", "orig": "Ye,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.73, "r_y0": 161.562, "r_x1": 178.582, "r_y1": 161.562, "r_x2": 178.582, "r_y2": 150.27300000000002, "r_x3": 168.73, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "J.,", "orig": "J.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.002, "r_y0": 161.562, "r_x1": 195.286, "r_y1": 161.562, "r_x2": 195.286, "r_y2": 150.27300000000002, "r_x3": 183.002, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Qi,", "orig": "Qi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.698, "r_y0": 161.562, "r_x1": 211.725, "r_y1": 161.562, "r_x2": 211.725, "r_y2": 150.27300000000002, "r_x3": 199.698, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "X.,", "orig": "X.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.145, "r_y0": 161.562, "r_x1": 246.149, "r_y1": 161.562, "r_x2": 246.149, "r_y2": 150.27300000000002, "r_x3": 216.145, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "He, Y.,", "orig": "He, Y.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.57, "r_y0": 161.562, "r_x1": 364.908, "r_y1": 161.562, "r_x2": 364.908, "r_y2": 150.27300000000002, "r_x3": 250.57, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Chen, Y., Gu, D., Gao, P.,", "orig": "Chen, Y., Gu, D., Gao, P.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.32, "r_y0": 161.562, "r_x1": 390.56, "r_y1": 161.562, "r_x2": 390.56, "r_y2": 150.27300000000002, "r_x3": 369.32, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Xiao,", "orig": "Xiao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.981, "r_y0": 161.562, "r_x1": 406.88, "r_y1": 161.562, "r_x2": 406.88, "r_y2": 150.27300000000002, "r_x3": 394.981, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "R.:", "orig": "R.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.291, "r_y0": 161.562, "r_x1": 480.594, "r_y1": 161.562, "r_x2": 480.594, "r_y2": 150.27300000000002, "r_x3": 411.291, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Pingan-vcgroup's", "orig": "Pingan-vcgroup's", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 172.52099999999996, "r_x1": 183.303, "r_y1": 172.52099999999996, "r_x2": 183.303, "r_y2": 161.23199999999997, "r_x3": 151.518, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "solution", "orig": "solution", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.948, "r_y0": 172.52099999999996, "r_x1": 198.974, "r_y1": 172.52099999999996, "r_x2": 198.974, "r_y2": 161.23199999999997, "r_x3": 187.948, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.618, "r_y0": 172.52099999999996, "r_x1": 223.601, "r_y1": 172.52099999999996, "r_x2": 223.601, "r_y2": 161.23199999999997, "r_x3": 203.618, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "icdar", "orig": "icdar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.245, "r_y0": 172.52099999999996, "r_x1": 246.664, "r_y1": 172.52099999999996, "r_x2": 246.664, "r_y2": 161.23199999999997, "r_x3": 228.245, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "2021", "orig": "2021", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.309, "r_y0": 172.52099999999996, "r_x1": 299.174, "r_y1": 172.52099999999996, "r_x2": 299.174, "r_y2": 161.23199999999997, "r_x3": 251.309, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "competition", "orig": "competition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 303.819, "r_y0": 172.52099999999996, "r_x1": 352.788, "r_y1": 172.52099999999996, "r_x2": 352.788, "r_y2": 161.23199999999997, "r_x3": 303.819, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "on scientific", "orig": "on scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.432, "r_y0": 172.52099999999996, "r_x1": 394.845, "r_y1": 172.52099999999996, "r_x2": 394.845, "r_y2": 161.23199999999997, "r_x3": 357.432, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "literature", "orig": "literature", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.49, "r_y0": 172.52099999999996, "r_x1": 428.737, "r_y1": 172.52099999999996, "r_x2": 428.737, "r_y2": 161.23199999999997, "r_x3": 399.49, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "parsing", "orig": "parsing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 433.381, "r_y0": 172.52099999999996, "r_x1": 450.068, "r_y1": 172.52099999999996, "r_x2": 450.068, "r_y2": 161.23199999999997, "r_x3": 433.381, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "task", "orig": "task", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.703, "r_y0": 172.52099999999996, "r_x1": 462.38, "r_y1": 172.52099999999996, "r_x2": 462.38, "r_y2": 161.23199999999997, "r_x3": 454.703, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "b:", "orig": "b:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.025, "r_y0": 172.52099999999996, "r_x1": 480.595, "r_y1": 172.52099999999996, "r_x2": 480.595, "r_y2": 161.23199999999997, "r_x3": 467.025, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "Ta-", "orig": "Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 183.48000000000002, "r_x1": 163.294, "r_y1": 183.48000000000002, "r_x2": 163.294, "r_y2": 172.19100000000003, "r_x3": 151.518, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "ble", "orig": "ble", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.732, "r_y0": 183.48000000000002, "r_x1": 212.287, "r_y1": 183.48000000000002, "r_x2": 212.287, "r_y2": 172.19100000000003, "r_x3": 167.732, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "recognition", "orig": "recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.734, "r_y0": 183.48000000000002, "r_x1": 224.924, "r_y1": 183.48000000000002, "r_x2": 224.924, "r_y2": 172.19100000000003, "r_x3": 216.734, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.362, "r_y0": 183.48000000000002, "r_x1": 280.64, "r_y1": 183.48000000000002, "r_x2": 280.64, "r_y2": 172.19100000000003, "r_x3": 229.362, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "html (2021).", "orig": "html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.078, "r_y0": 182.58399999999995, "r_x1": 478.034, "r_y1": 182.58399999999995, "r_x2": 478.034, "r_y2": 175.115, "r_x3": 285.078, "r_y3": 175.115, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.032, "r_y0": 183.48000000000002, "r_x1": 480.591, "r_y1": 183.48000000000002, "r_x2": 480.591, "r_y2": 172.19100000000003, "r_x3": 478.032, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 193.543, "r_x1": 302.116, "r_y1": 193.543, "r_x2": 302.116, "r_y2": 186.07399999999996, "r_x3": 151.518, "r_y3": 186.07399999999996, "coord_origin": "TOPLEFT"}, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 205.39800000000002, "r_x1": 146.538, "r_y1": 205.39800000000002, "r_x2": 146.538, "r_y2": 194.10900000000004, "r_x3": 134.765, "r_y3": 194.10900000000004, "coord_origin": "TOPLEFT"}, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 205.39800000000002, "r_x1": 480.594, "r_y1": 205.39800000000002, "r_x2": 480.594, "r_y2": 194.10900000000004, "r_x3": 151.514, "r_y3": 194.10900000000004, "coord_origin": "TOPLEFT"}, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 216.356, "r_x1": 318.551, "r_y1": 216.356, "r_x2": 318.551, "r_y2": 205.067, "r_x3": 151.518, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.621, "r_y0": 215.20799999999997, "r_x1": 337.532, "r_y1": 215.20799999999997, "r_x2": 337.532, "r_y2": 207.28200000000004, "r_x3": 321.621, "r_y3": 207.28200000000004, "coord_origin": "TOPLEFT"}, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.533, "r_y0": 216.356, "r_x1": 340.092, "r_y1": 216.356, "r_x2": 340.092, "r_y2": 205.067, "r_x3": 337.533, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.159, "r_y0": 216.356, "r_x1": 399.469, "r_y1": 216.356, "r_x2": 399.469, "r_y2": 205.067, "r_x3": 343.159, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": "108565 (2022)", "orig": "108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 227.31500000000005, "r_x1": 146.538, "r_y1": 227.31500000000005, "r_x2": 146.538, "r_y2": 216.02599999999995, "r_x3": 134.765, "r_y3": 216.02599999999995, "coord_origin": "TOPLEFT"}, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 227.31500000000005, "r_x1": 480.59, "r_y1": 227.31500000000005, "r_x2": 480.59, "r_y2": 216.02599999999995, "r_x3": 151.514, "r_y3": 216.02599999999995, "coord_origin": "TOPLEFT"}, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 238.274, "r_x1": 480.591, "r_y1": 238.274, "r_x2": 480.591, "r_y2": 226.985, "r_x3": 151.518, "r_y3": 226.985, "coord_origin": "TOPLEFT"}, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 249.23299999999995, "r_x1": 480.591, "r_y1": 249.23299999999995, "r_x2": 480.591, "r_y2": 237.94399999999996, "r_x3": 151.518, "r_y3": 237.94399999999996, "coord_origin": "TOPLEFT"}, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 260.192, "r_x1": 293.441, "r_y1": 260.192, "r_x2": 293.441, "r_y2": 248.90300000000002, "r_x3": 151.518, "r_y3": 248.90300000000002, "coord_origin": "TOPLEFT"}, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.05, "r_y0": 259.29600000000005, "r_x1": 480.593, "r_y1": 259.29600000000005, "r_x2": 480.593, "r_y2": 251.827, "r_x3": 297.05, "r_y3": 251.827, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 270.255, "r_x1": 175.05, "r_y1": 270.255, "r_x2": 175.05, "r_y2": 262.78599999999994, "r_x3": 151.518, "r_y3": 262.78599999999994, "coord_origin": "TOPLEFT"}, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 282.11, "r_x1": 146.538, "r_y1": 282.11, "r_x2": 146.538, "r_y2": 270.821, "r_x3": 134.765, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 282.11, "r_x1": 271.779, "r_y1": 282.11, "r_x2": 271.779, "r_y2": 270.821, "r_x3": 151.514, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "Zhong, X., ShafieiBavani, E.,", "orig": "Zhong, X., ShafieiBavani, E.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.957, "r_y0": 282.11, "r_x1": 480.591, "r_y1": 282.11, "r_x2": 480.591, "r_y2": 270.821, "r_x3": 275.957, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "Jimeno Yepes, A.: Image-based table recognition:", "orig": "Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 293.069, "r_x1": 480.588, "r_y1": 293.069, "r_x2": 480.588, "r_y2": 281.78, "r_x3": 151.518, "r_y3": 281.78, "coord_origin": "TOPLEFT"}, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 304.028, "r_x1": 480.596, "r_y1": 304.028, "r_x2": 480.596, "r_y2": 292.739, "r_x3": 151.518, "r_y3": 292.739, "coord_origin": "TOPLEFT"}, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 314.987, "r_x1": 236.024, "r_y1": 314.987, "r_x2": 236.024, "r_y2": 303.698, "r_x3": 151.518, "r_y3": 303.698, "coord_origin": "TOPLEFT"}, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 325.946, "r_x1": 146.538, "r_y1": 325.946, "r_x2": 146.538, "r_y2": 314.657, "r_x3": 134.765, "r_y3": 314.657, "coord_origin": "TOPLEFT"}, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 325.946, "r_x1": 480.595, "r_y1": 325.946, "r_x2": 480.595, "r_y2": 314.657, "r_x3": 151.514, "r_y3": 314.657, "coord_origin": "TOPLEFT"}, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 336.904, "r_x1": 480.594, "r_y1": 336.904, "r_x2": 480.594, "r_y2": 325.615, "r_x3": 151.518, "r_y3": 325.615, "coord_origin": "TOPLEFT"}, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 347.863, "r_x1": 335.136, "r_y1": 347.863, "r_x2": 335.136, "r_y2": 336.574, "r_x3": 151.518, "r_y3": 336.574, "coord_origin": "TOPLEFT"}, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 7, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 143.979, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.7012730240821838, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "page_header", "bbox": {"l": 167.821, "t": 91.49300000000005, "r": 231.72, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.7889755964279175, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 134.765, "t": 117.39599999999996, "r": 480.591, "b": 150.60299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9444757699966431, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.68499999999995, "r_x1": 146.538, "r_y1": 128.68499999999995, "r_x2": 146.538, "r_y2": 117.39599999999996, "r_x3": 134.765, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 128.68499999999995, "r_x1": 480.589, "r_y1": 128.68499999999995, "r_x2": 480.589, "r_y2": 117.39599999999996, "r_x3": 151.514, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 139.644, "r_x1": 167.385, "r_y1": 139.644, "r_x2": 167.385, "r_y2": 128.35500000000002, "r_x3": 151.518, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "tion", "orig": "tion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.492, "r_y0": 139.644, "r_x1": 334.467, "r_y1": 139.644, "r_x2": 334.467, "r_y2": 128.35500000000002, "r_x3": 171.492, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.573, "r_y0": 139.644, "r_x1": 349.576, "r_y1": 139.644, "r_x2": 349.576, "r_y2": 128.35500000000002, "r_x3": 338.573, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "In:", "orig": "In:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.674, "r_y0": 139.644, "r_x1": 480.591, "r_y1": 139.644, "r_x2": 480.591, "r_y2": 128.35500000000002, "r_x3": 353.674, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 150.60299999999995, "r_x1": 427.533, "r_y1": 150.60299999999995, "r_x2": 427.533, "r_y2": 139.31399999999996, "r_x3": 151.518, "r_y3": 139.31399999999996, "coord_origin": "TOPLEFT"}, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 134.765, "t": 150.27300000000002, "r": 480.595, "b": 193.543, "coord_origin": "TOPLEFT"}, "confidence": 0.9540892243385315, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 161.562, "r_x1": 146.538, "r_y1": 161.562, "r_x2": 146.538, "r_y2": 150.27300000000002, "r_x3": 134.765, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 161.562, "r_x1": 164.318, "r_y1": 161.562, "r_x2": 164.318, "r_y2": 150.27300000000002, "r_x3": 151.514, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Ye,", "orig": "Ye,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.73, "r_y0": 161.562, "r_x1": 178.582, "r_y1": 161.562, "r_x2": 178.582, "r_y2": 150.27300000000002, "r_x3": 168.73, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "J.,", "orig": "J.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.002, "r_y0": 161.562, "r_x1": 195.286, "r_y1": 161.562, "r_x2": 195.286, "r_y2": 150.27300000000002, "r_x3": 183.002, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Qi,", "orig": "Qi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.698, "r_y0": 161.562, "r_x1": 211.725, "r_y1": 161.562, "r_x2": 211.725, "r_y2": 150.27300000000002, "r_x3": 199.698, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "X.,", "orig": "X.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.145, "r_y0": 161.562, "r_x1": 246.149, "r_y1": 161.562, "r_x2": 246.149, "r_y2": 150.27300000000002, "r_x3": 216.145, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "He, Y.,", "orig": "He, Y.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.57, "r_y0": 161.562, "r_x1": 364.908, "r_y1": 161.562, "r_x2": 364.908, "r_y2": 150.27300000000002, "r_x3": 250.57, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Chen, Y., Gu, D., Gao, P.,", "orig": "Chen, Y., Gu, D., Gao, P.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.32, "r_y0": 161.562, "r_x1": 390.56, "r_y1": 161.562, "r_x2": 390.56, "r_y2": 150.27300000000002, "r_x3": 369.32, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Xiao,", "orig": "Xiao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.981, "r_y0": 161.562, "r_x1": 406.88, "r_y1": 161.562, "r_x2": 406.88, "r_y2": 150.27300000000002, "r_x3": 394.981, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "R.:", "orig": "R.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.291, "r_y0": 161.562, "r_x1": 480.594, "r_y1": 161.562, "r_x2": 480.594, "r_y2": 150.27300000000002, "r_x3": 411.291, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Pingan-vcgroup's", "orig": "Pingan-vcgroup's", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 172.52099999999996, "r_x1": 183.303, "r_y1": 172.52099999999996, "r_x2": 183.303, "r_y2": 161.23199999999997, "r_x3": 151.518, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "solution", "orig": "solution", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.948, "r_y0": 172.52099999999996, "r_x1": 198.974, "r_y1": 172.52099999999996, "r_x2": 198.974, "r_y2": 161.23199999999997, "r_x3": 187.948, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.618, "r_y0": 172.52099999999996, "r_x1": 223.601, "r_y1": 172.52099999999996, "r_x2": 223.601, "r_y2": 161.23199999999997, "r_x3": 203.618, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "icdar", "orig": "icdar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.245, "r_y0": 172.52099999999996, "r_x1": 246.664, "r_y1": 172.52099999999996, "r_x2": 246.664, "r_y2": 161.23199999999997, "r_x3": 228.245, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "2021", "orig": "2021", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.309, "r_y0": 172.52099999999996, "r_x1": 299.174, "r_y1": 172.52099999999996, "r_x2": 299.174, "r_y2": 161.23199999999997, "r_x3": 251.309, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "competition", "orig": "competition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 303.819, "r_y0": 172.52099999999996, "r_x1": 352.788, "r_y1": 172.52099999999996, "r_x2": 352.788, "r_y2": 161.23199999999997, "r_x3": 303.819, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "on scientific", "orig": "on scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.432, "r_y0": 172.52099999999996, "r_x1": 394.845, "r_y1": 172.52099999999996, "r_x2": 394.845, "r_y2": 161.23199999999997, "r_x3": 357.432, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "literature", "orig": "literature", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.49, "r_y0": 172.52099999999996, "r_x1": 428.737, "r_y1": 172.52099999999996, "r_x2": 428.737, "r_y2": 161.23199999999997, "r_x3": 399.49, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "parsing", "orig": "parsing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 433.381, "r_y0": 172.52099999999996, "r_x1": 450.068, "r_y1": 172.52099999999996, "r_x2": 450.068, "r_y2": 161.23199999999997, "r_x3": 433.381, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "task", "orig": "task", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.703, "r_y0": 172.52099999999996, "r_x1": 462.38, "r_y1": 172.52099999999996, "r_x2": 462.38, "r_y2": 161.23199999999997, "r_x3": 454.703, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "b:", "orig": "b:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.025, "r_y0": 172.52099999999996, "r_x1": 480.595, "r_y1": 172.52099999999996, "r_x2": 480.595, "r_y2": 161.23199999999997, "r_x3": 467.025, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "Ta-", "orig": "Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 183.48000000000002, "r_x1": 163.294, "r_y1": 183.48000000000002, "r_x2": 163.294, "r_y2": 172.19100000000003, "r_x3": 151.518, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "ble", "orig": "ble", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.732, "r_y0": 183.48000000000002, "r_x1": 212.287, "r_y1": 183.48000000000002, "r_x2": 212.287, "r_y2": 172.19100000000003, "r_x3": 167.732, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "recognition", "orig": "recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.734, "r_y0": 183.48000000000002, "r_x1": 224.924, "r_y1": 183.48000000000002, "r_x2": 224.924, "r_y2": 172.19100000000003, "r_x3": 216.734, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.362, "r_y0": 183.48000000000002, "r_x1": 280.64, "r_y1": 183.48000000000002, "r_x2": 280.64, "r_y2": 172.19100000000003, "r_x3": 229.362, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "html (2021).", "orig": "html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.078, "r_y0": 182.58399999999995, "r_x1": 478.034, "r_y1": 182.58399999999995, "r_x2": 478.034, "r_y2": 175.115, "r_x3": 285.078, "r_y3": 175.115, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.032, "r_y0": 183.48000000000002, "r_x1": 480.591, "r_y1": 183.48000000000002, "r_x2": 480.591, "r_y2": 172.19100000000003, "r_x3": 478.032, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 193.543, "r_x1": 302.116, "r_y1": 193.543, "r_x2": 302.116, "r_y2": 186.07399999999996, "r_x3": 151.518, "r_y3": 186.07399999999996, "coord_origin": "TOPLEFT"}, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 134.765, "t": 194.10900000000004, "r": 480.594, "b": 216.356, "coord_origin": "TOPLEFT"}, "confidence": 0.9531471729278564, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 205.39800000000002, "r_x1": 146.538, "r_y1": 205.39800000000002, "r_x2": 146.538, "r_y2": 194.10900000000004, "r_x3": 134.765, "r_y3": 194.10900000000004, "coord_origin": "TOPLEFT"}, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 205.39800000000002, "r_x1": 480.594, "r_y1": 205.39800000000002, "r_x2": 480.594, "r_y2": 194.10900000000004, "r_x3": 151.514, "r_y3": 194.10900000000004, "coord_origin": "TOPLEFT"}, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 216.356, "r_x1": 318.551, "r_y1": 216.356, "r_x2": 318.551, "r_y2": 205.067, "r_x3": 151.518, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.621, "r_y0": 215.20799999999997, "r_x1": 337.532, "r_y1": 215.20799999999997, "r_x2": 337.532, "r_y2": 207.28200000000004, "r_x3": 321.621, "r_y3": 207.28200000000004, "coord_origin": "TOPLEFT"}, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.533, "r_y0": 216.356, "r_x1": 340.092, "r_y1": 216.356, "r_x2": 340.092, "r_y2": 205.067, "r_x3": 337.533, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.159, "r_y0": 216.356, "r_x1": 399.469, "r_y1": 216.356, "r_x2": 399.469, "r_y2": 205.067, "r_x3": 343.159, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": "108565 (2022)", "orig": "108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "list_item", "bbox": {"l": 134.765, "t": 216.02599999999995, "r": 480.593, "b": 270.255, "coord_origin": "TOPLEFT"}, "confidence": 0.972027063369751, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 227.31500000000005, "r_x1": 146.538, "r_y1": 227.31500000000005, "r_x2": 146.538, "r_y2": 216.02599999999995, "r_x3": 134.765, "r_y3": 216.02599999999995, "coord_origin": "TOPLEFT"}, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 227.31500000000005, "r_x1": 480.59, "r_y1": 227.31500000000005, "r_x2": 480.59, "r_y2": 216.02599999999995, "r_x3": 151.514, "r_y3": 216.02599999999995, "coord_origin": "TOPLEFT"}, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 238.274, "r_x1": 480.591, "r_y1": 238.274, "r_x2": 480.591, "r_y2": 226.985, "r_x3": 151.518, "r_y3": 226.985, "coord_origin": "TOPLEFT"}, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 249.23299999999995, "r_x1": 480.591, "r_y1": 249.23299999999995, "r_x2": 480.591, "r_y2": 237.94399999999996, "r_x3": 151.518, "r_y3": 237.94399999999996, "coord_origin": "TOPLEFT"}, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 260.192, "r_x1": 293.441, "r_y1": 260.192, "r_x2": 293.441, "r_y2": 248.90300000000002, "r_x3": 151.518, "r_y3": 248.90300000000002, "coord_origin": "TOPLEFT"}, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.05, "r_y0": 259.29600000000005, "r_x1": 480.593, "r_y1": 259.29600000000005, "r_x2": 480.593, "r_y2": 251.827, "r_x3": 297.05, "r_y3": 251.827, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 270.255, "r_x1": 175.05, "r_y1": 270.255, "r_x2": 175.05, "r_y2": 262.78599999999994, "r_x3": 151.518, "r_y3": 262.78599999999994, "coord_origin": "TOPLEFT"}, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "list_item", "bbox": {"l": 134.765, "t": 270.821, "r": 480.596, "b": 314.987, "coord_origin": "TOPLEFT"}, "confidence": 0.9685125946998596, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 282.11, "r_x1": 146.538, "r_y1": 282.11, "r_x2": 146.538, "r_y2": 270.821, "r_x3": 134.765, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 282.11, "r_x1": 271.779, "r_y1": 282.11, "r_x2": 271.779, "r_y2": 270.821, "r_x3": 151.514, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "Zhong, X., ShafieiBavani, E.,", "orig": "Zhong, X., ShafieiBavani, E.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.957, "r_y0": 282.11, "r_x1": 480.591, "r_y1": 282.11, "r_x2": 480.591, "r_y2": 270.821, "r_x3": 275.957, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "Jimeno Yepes, A.: Image-based table recognition:", "orig": "Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 293.069, "r_x1": 480.588, "r_y1": 293.069, "r_x2": 480.588, "r_y2": 281.78, "r_x3": 151.518, "r_y3": 281.78, "coord_origin": "TOPLEFT"}, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 304.028, "r_x1": 480.596, "r_y1": 304.028, "r_x2": 480.596, "r_y2": 292.739, "r_x3": 151.518, "r_y3": 292.739, "coord_origin": "TOPLEFT"}, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 314.987, "r_x1": 236.024, "r_y1": 314.987, "r_x2": 236.024, "r_y2": 303.698, "r_x3": 151.518, "r_y3": 303.698, "coord_origin": "TOPLEFT"}, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "list_item", "bbox": {"l": 134.765, "t": 314.657, "r": 480.595, "b": 347.863, "coord_origin": "TOPLEFT"}, "confidence": 0.9668973684310913, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 325.946, "r_x1": 146.538, "r_y1": 325.946, "r_x2": 146.538, "r_y2": 314.657, "r_x3": 134.765, "r_y3": 314.657, "coord_origin": "TOPLEFT"}, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 325.946, "r_x1": 480.595, "r_y1": 325.946, "r_x2": 480.595, "r_y2": 314.657, "r_x3": 151.514, "r_y3": 314.657, "coord_origin": "TOPLEFT"}, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 336.904, "r_x1": 480.594, "r_y1": 336.904, "r_x2": 480.594, "r_y2": 325.615, "r_x3": 151.518, "r_y3": 325.615, "coord_origin": "TOPLEFT"}, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 347.863, "r_x1": 335.136, "r_y1": 347.863, "r_x2": 335.136, "r_y2": 336.574, "r_x3": 151.518, "r_y3": 336.574, "coord_origin": "TOPLEFT"}, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "page_header", "id": 7, "page_no": 13, "cluster": {"id": 7, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 143.979, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.7012730240821838, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "14"}, {"label": "page_header", "id": 6, "page_no": 13, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 167.821, "t": 91.49300000000005, "r": 231.72, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.7889755964279175, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}, {"label": "list_item", "id": 5, "page_no": 13, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 134.765, "t": 117.39599999999996, "r": 480.591, "b": 150.60299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9444757699966431, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.68499999999995, "r_x1": 146.538, "r_y1": 128.68499999999995, "r_x2": 146.538, "r_y2": 117.39599999999996, "r_x3": 134.765, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 128.68499999999995, "r_x1": 480.589, "r_y1": 128.68499999999995, "r_x2": 480.589, "r_y2": 117.39599999999996, "r_x3": 151.514, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 139.644, "r_x1": 167.385, "r_y1": 139.644, "r_x2": 167.385, "r_y2": 128.35500000000002, "r_x3": 151.518, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "tion", "orig": "tion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.492, "r_y0": 139.644, "r_x1": 334.467, "r_y1": 139.644, "r_x2": 334.467, "r_y2": 128.35500000000002, "r_x3": 171.492, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.573, "r_y0": 139.644, "r_x1": 349.576, "r_y1": 139.644, "r_x2": 349.576, "r_y2": 128.35500000000002, "r_x3": 338.573, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "In:", "orig": "In:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.674, "r_y0": 139.644, "r_x1": 480.591, "r_y1": 139.644, "r_x2": 480.591, "r_y2": 128.35500000000002, "r_x3": 353.674, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 150.60299999999995, "r_x1": 427.533, "r_y1": 150.60299999999995, "r_x2": 427.533, "r_y2": 139.31399999999996, "r_x3": 151.518, "r_y3": 139.31399999999996, "coord_origin": "TOPLEFT"}, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "18. Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruction network for table structure recognition. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. pp. 1295-1304 (2021)"}, {"label": "list_item", "id": 3, "page_no": 13, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 134.765, "t": 150.27300000000002, "r": 480.595, "b": 193.543, "coord_origin": "TOPLEFT"}, "confidence": 0.9540892243385315, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 161.562, "r_x1": 146.538, "r_y1": 161.562, "r_x2": 146.538, "r_y2": 150.27300000000002, "r_x3": 134.765, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 161.562, "r_x1": 164.318, "r_y1": 161.562, "r_x2": 164.318, "r_y2": 150.27300000000002, "r_x3": 151.514, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Ye,", "orig": "Ye,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.73, "r_y0": 161.562, "r_x1": 178.582, "r_y1": 161.562, "r_x2": 178.582, "r_y2": 150.27300000000002, "r_x3": 168.73, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "J.,", "orig": "J.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.002, "r_y0": 161.562, "r_x1": 195.286, "r_y1": 161.562, "r_x2": 195.286, "r_y2": 150.27300000000002, "r_x3": 183.002, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Qi,", "orig": "Qi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.698, "r_y0": 161.562, "r_x1": 211.725, "r_y1": 161.562, "r_x2": 211.725, "r_y2": 150.27300000000002, "r_x3": 199.698, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "X.,", "orig": "X.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.145, "r_y0": 161.562, "r_x1": 246.149, "r_y1": 161.562, "r_x2": 246.149, "r_y2": 150.27300000000002, "r_x3": 216.145, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "He, Y.,", "orig": "He, Y.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.57, "r_y0": 161.562, "r_x1": 364.908, "r_y1": 161.562, "r_x2": 364.908, "r_y2": 150.27300000000002, "r_x3": 250.57, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Chen, Y., Gu, D., Gao, P.,", "orig": "Chen, Y., Gu, D., Gao, P.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.32, "r_y0": 161.562, "r_x1": 390.56, "r_y1": 161.562, "r_x2": 390.56, "r_y2": 150.27300000000002, "r_x3": 369.32, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Xiao,", "orig": "Xiao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.981, "r_y0": 161.562, "r_x1": 406.88, "r_y1": 161.562, "r_x2": 406.88, "r_y2": 150.27300000000002, "r_x3": 394.981, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "R.:", "orig": "R.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.291, "r_y0": 161.562, "r_x1": 480.594, "r_y1": 161.562, "r_x2": 480.594, "r_y2": 150.27300000000002, "r_x3": 411.291, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Pingan-vcgroup's", "orig": "Pingan-vcgroup's", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 172.52099999999996, "r_x1": 183.303, "r_y1": 172.52099999999996, "r_x2": 183.303, "r_y2": 161.23199999999997, "r_x3": 151.518, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "solution", "orig": "solution", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.948, "r_y0": 172.52099999999996, "r_x1": 198.974, "r_y1": 172.52099999999996, "r_x2": 198.974, "r_y2": 161.23199999999997, "r_x3": 187.948, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.618, "r_y0": 172.52099999999996, "r_x1": 223.601, "r_y1": 172.52099999999996, "r_x2": 223.601, "r_y2": 161.23199999999997, "r_x3": 203.618, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "icdar", "orig": "icdar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.245, "r_y0": 172.52099999999996, "r_x1": 246.664, "r_y1": 172.52099999999996, "r_x2": 246.664, "r_y2": 161.23199999999997, "r_x3": 228.245, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "2021", "orig": "2021", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.309, "r_y0": 172.52099999999996, "r_x1": 299.174, "r_y1": 172.52099999999996, "r_x2": 299.174, "r_y2": 161.23199999999997, "r_x3": 251.309, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "competition", "orig": "competition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 303.819, "r_y0": 172.52099999999996, "r_x1": 352.788, "r_y1": 172.52099999999996, "r_x2": 352.788, "r_y2": 161.23199999999997, "r_x3": 303.819, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "on scientific", "orig": "on scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.432, "r_y0": 172.52099999999996, "r_x1": 394.845, "r_y1": 172.52099999999996, "r_x2": 394.845, "r_y2": 161.23199999999997, "r_x3": 357.432, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "literature", "orig": "literature", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.49, "r_y0": 172.52099999999996, "r_x1": 428.737, "r_y1": 172.52099999999996, "r_x2": 428.737, "r_y2": 161.23199999999997, "r_x3": 399.49, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "parsing", "orig": "parsing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 433.381, "r_y0": 172.52099999999996, "r_x1": 450.068, "r_y1": 172.52099999999996, "r_x2": 450.068, "r_y2": 161.23199999999997, "r_x3": 433.381, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "task", "orig": "task", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.703, "r_y0": 172.52099999999996, "r_x1": 462.38, "r_y1": 172.52099999999996, "r_x2": 462.38, "r_y2": 161.23199999999997, "r_x3": 454.703, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "b:", "orig": "b:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.025, "r_y0": 172.52099999999996, "r_x1": 480.595, "r_y1": 172.52099999999996, "r_x2": 480.595, "r_y2": 161.23199999999997, "r_x3": 467.025, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "Ta-", "orig": "Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 183.48000000000002, "r_x1": 163.294, "r_y1": 183.48000000000002, "r_x2": 163.294, "r_y2": 172.19100000000003, "r_x3": 151.518, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "ble", "orig": "ble", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.732, "r_y0": 183.48000000000002, "r_x1": 212.287, "r_y1": 183.48000000000002, "r_x2": 212.287, "r_y2": 172.19100000000003, "r_x3": 167.732, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "recognition", "orig": "recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.734, "r_y0": 183.48000000000002, "r_x1": 224.924, "r_y1": 183.48000000000002, "r_x2": 224.924, "r_y2": 172.19100000000003, "r_x3": 216.734, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.362, "r_y0": 183.48000000000002, "r_x1": 280.64, "r_y1": 183.48000000000002, "r_x2": 280.64, "r_y2": 172.19100000000003, "r_x3": 229.362, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "html (2021).", "orig": "html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.078, "r_y0": 182.58399999999995, "r_x1": 478.034, "r_y1": 182.58399999999995, "r_x2": 478.034, "r_y2": 175.115, "r_x3": 285.078, "r_y3": 175.115, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.032, "r_y0": 183.48000000000002, "r_x1": 480.591, "r_y1": 183.48000000000002, "r_x2": 480.591, "r_y2": 172.19100000000003, "r_x3": 478.032, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 193.543, "r_x1": 302.116, "r_y1": 193.543, "r_x2": 302.116, "r_y2": 186.07399999999996, "r_x3": 151.518, "r_y3": 186.07399999999996, "coord_origin": "TOPLEFT"}, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "19. Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup's solution for icdar 2021 competition on scientific literature parsing task b: Table recognition to html (2021). https://doi.org/10.48550/ARXIV.2105.01848 , https://arxiv.org/abs/2105.01848"}, {"label": "list_item", "id": 4, "page_no": 13, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 134.765, "t": 194.10900000000004, "r": 480.594, "b": 216.356, "coord_origin": "TOPLEFT"}, "confidence": 0.9531471729278564, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 205.39800000000002, "r_x1": 146.538, "r_y1": 205.39800000000002, "r_x2": 146.538, "r_y2": 194.10900000000004, "r_x3": 134.765, "r_y3": 194.10900000000004, "coord_origin": "TOPLEFT"}, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 205.39800000000002, "r_x1": 480.594, "r_y1": 205.39800000000002, "r_x2": 480.594, "r_y2": 194.10900000000004, "r_x3": 151.514, "r_y3": 194.10900000000004, "coord_origin": "TOPLEFT"}, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 216.356, "r_x1": 318.551, "r_y1": 216.356, "r_x2": 318.551, "r_y2": 205.067, "r_x3": 151.518, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.621, "r_y0": 215.20799999999997, "r_x1": 337.532, "r_y1": 215.20799999999997, "r_x2": 337.532, "r_y2": 207.28200000000004, "r_x3": 321.621, "r_y3": 207.28200000000004, "coord_origin": "TOPLEFT"}, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.533, "r_y0": 216.356, "r_x1": 340.092, "r_y1": 216.356, "r_x2": 340.092, "r_y2": 205.067, "r_x3": 337.533, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.159, "r_y0": 216.356, "r_x1": 399.469, "r_y1": 216.356, "r_x2": 399.469, "r_y2": 205.067, "r_x3": 343.159, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": "108565 (2022)", "orig": "108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "20. Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table structure recognizer. Pattern Recognition 126 , 108565 (2022)"}, {"label": "list_item", "id": 0, "page_no": 13, "cluster": {"id": 0, "label": "list_item", "bbox": {"l": 134.765, "t": 216.02599999999995, "r": 480.593, "b": 270.255, "coord_origin": "TOPLEFT"}, "confidence": 0.972027063369751, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 227.31500000000005, "r_x1": 146.538, "r_y1": 227.31500000000005, "r_x2": 146.538, "r_y2": 216.02599999999995, "r_x3": 134.765, "r_y3": 216.02599999999995, "coord_origin": "TOPLEFT"}, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 227.31500000000005, "r_x1": 480.59, "r_y1": 227.31500000000005, "r_x2": 480.59, "r_y2": 216.02599999999995, "r_x3": 151.514, "r_y3": 216.02599999999995, "coord_origin": "TOPLEFT"}, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 238.274, "r_x1": 480.591, "r_y1": 238.274, "r_x2": 480.591, "r_y2": 226.985, "r_x3": 151.518, "r_y3": 226.985, "coord_origin": "TOPLEFT"}, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 249.23299999999995, "r_x1": 480.591, "r_y1": 249.23299999999995, "r_x2": 480.591, "r_y2": 237.94399999999996, "r_x3": 151.518, "r_y3": 237.94399999999996, "coord_origin": "TOPLEFT"}, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 260.192, "r_x1": 293.441, "r_y1": 260.192, "r_x2": 293.441, "r_y2": 248.90300000000002, "r_x3": 151.518, "r_y3": 248.90300000000002, "coord_origin": "TOPLEFT"}, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.05, "r_y0": 259.29600000000005, "r_x1": 480.593, "r_y1": 259.29600000000005, "r_x2": 480.593, "r_y2": 251.827, "r_x3": 297.05, "r_y3": 251.827, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 270.255, "r_x1": 175.05, "r_y1": 270.255, "r_x2": 175.05, "r_y2": 262.78599999999994, "r_x3": 151.518, "r_y3": 262.78599999999994, "coord_origin": "TOPLEFT"}, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "21. Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vision (WACV). pp. 697-706 (2021). https://doi.org/10.1109/WACV48630.2021. 00074"}, {"label": "list_item", "id": 1, "page_no": 13, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 134.765, "t": 270.821, "r": 480.596, "b": 314.987, "coord_origin": "TOPLEFT"}, "confidence": 0.9685125946998596, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 282.11, "r_x1": 146.538, "r_y1": 282.11, "r_x2": 146.538, "r_y2": 270.821, "r_x3": 134.765, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 282.11, "r_x1": 271.779, "r_y1": 282.11, "r_x2": 271.779, "r_y2": 270.821, "r_x3": 151.514, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "Zhong, X., ShafieiBavani, E.,", "orig": "Zhong, X., ShafieiBavani, E.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.957, "r_y0": 282.11, "r_x1": 480.591, "r_y1": 282.11, "r_x2": 480.591, "r_y2": 270.821, "r_x3": 275.957, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "Jimeno Yepes, A.: Image-based table recognition:", "orig": "Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 293.069, "r_x1": 480.588, "r_y1": 293.069, "r_x2": 480.588, "r_y2": 281.78, "r_x3": 151.518, "r_y3": 281.78, "coord_origin": "TOPLEFT"}, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 304.028, "r_x1": 480.596, "r_y1": 304.028, "r_x2": 480.596, "r_y2": 292.739, "r_x3": 151.518, "r_y3": 292.739, "coord_origin": "TOPLEFT"}, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 314.987, "r_x1": 236.024, "r_y1": 314.987, "r_x2": 236.024, "r_y2": 303.698, "r_x3": 151.518, "r_y3": 303.698, "coord_origin": "TOPLEFT"}, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "22. Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition: Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M. (eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Publishing, Cham (2020)"}, {"label": "list_item", "id": 2, "page_no": 13, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 134.765, "t": 314.657, "r": 480.595, "b": 347.863, "coord_origin": "TOPLEFT"}, "confidence": 0.9668973684310913, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 325.946, "r_x1": 146.538, "r_y1": 325.946, "r_x2": 146.538, "r_y2": 314.657, "r_x3": 134.765, "r_y3": 314.657, "coord_origin": "TOPLEFT"}, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 325.946, "r_x1": 480.595, "r_y1": 325.946, "r_x2": 480.595, "r_y2": 314.657, "r_x3": 151.514, "r_y3": 314.657, "coord_origin": "TOPLEFT"}, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 336.904, "r_x1": 480.594, "r_y1": 336.904, "r_x2": 480.594, "r_y2": 325.615, "r_x3": 151.518, "r_y3": 325.615, "coord_origin": "TOPLEFT"}, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 347.863, "r_x1": 335.136, "r_y1": 347.863, "r_x2": 335.136, "r_y2": 336.574, "r_x3": 151.518, "r_y3": 336.574, "coord_origin": "TOPLEFT"}, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "23. Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document layout analysis. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1015-1022. IEEE (2019)"}], "body": [{"label": "list_item", "id": 5, "page_no": 13, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 134.765, "t": 117.39599999999996, "r": 480.591, "b": 150.60299999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9444757699966431, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 128.68499999999995, "r_x1": 146.538, "r_y1": 128.68499999999995, "r_x2": 146.538, "r_y2": 117.39599999999996, "r_x3": 134.765, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 128.68499999999995, "r_x1": 480.589, "r_y1": 128.68499999999995, "r_x2": 480.589, "r_y2": 117.39599999999996, "r_x3": 151.514, "r_y3": 117.39599999999996, "coord_origin": "TOPLEFT"}, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 139.644, "r_x1": 167.385, "r_y1": 139.644, "r_x2": 167.385, "r_y2": 128.35500000000002, "r_x3": 151.518, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "tion", "orig": "tion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.492, "r_y0": 139.644, "r_x1": 334.467, "r_y1": 139.644, "r_x2": 334.467, "r_y2": 128.35500000000002, "r_x3": 171.492, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "network for table structure recognition.", "orig": "network for table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.573, "r_y0": 139.644, "r_x1": 349.576, "r_y1": 139.644, "r_x2": 349.576, "r_y2": 128.35500000000002, "r_x3": 338.573, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "In:", "orig": "In:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.674, "r_y0": 139.644, "r_x1": 480.591, "r_y1": 139.644, "r_x2": 480.591, "r_y2": 128.35500000000002, "r_x3": 353.674, "r_y3": 128.35500000000002, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 150.60299999999995, "r_x1": 427.533, "r_y1": 150.60299999999995, "r_x2": 427.533, "r_y2": 139.31399999999996, "r_x3": 151.518, "r_y3": 139.31399999999996, "coord_origin": "TOPLEFT"}, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "18. Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruction network for table structure recognition. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. pp. 1295-1304 (2021)"}, {"label": "list_item", "id": 3, "page_no": 13, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 134.765, "t": 150.27300000000002, "r": 480.595, "b": 193.543, "coord_origin": "TOPLEFT"}, "confidence": 0.9540892243385315, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 161.562, "r_x1": 146.538, "r_y1": 161.562, "r_x2": 146.538, "r_y2": 150.27300000000002, "r_x3": 134.765, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 161.562, "r_x1": 164.318, "r_y1": 161.562, "r_x2": 164.318, "r_y2": 150.27300000000002, "r_x3": 151.514, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Ye,", "orig": "Ye,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.73, "r_y0": 161.562, "r_x1": 178.582, "r_y1": 161.562, "r_x2": 178.582, "r_y2": 150.27300000000002, "r_x3": 168.73, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "J.,", "orig": "J.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.002, "r_y0": 161.562, "r_x1": 195.286, "r_y1": 161.562, "r_x2": 195.286, "r_y2": 150.27300000000002, "r_x3": 183.002, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Qi,", "orig": "Qi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.698, "r_y0": 161.562, "r_x1": 211.725, "r_y1": 161.562, "r_x2": 211.725, "r_y2": 150.27300000000002, "r_x3": 199.698, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "X.,", "orig": "X.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.145, "r_y0": 161.562, "r_x1": 246.149, "r_y1": 161.562, "r_x2": 246.149, "r_y2": 150.27300000000002, "r_x3": 216.145, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "He, Y.,", "orig": "He, Y.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.57, "r_y0": 161.562, "r_x1": 364.908, "r_y1": 161.562, "r_x2": 364.908, "r_y2": 150.27300000000002, "r_x3": 250.57, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Chen, Y., Gu, D., Gao, P.,", "orig": "Chen, Y., Gu, D., Gao, P.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.32, "r_y0": 161.562, "r_x1": 390.56, "r_y1": 161.562, "r_x2": 390.56, "r_y2": 150.27300000000002, "r_x3": 369.32, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Xiao,", "orig": "Xiao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.981, "r_y0": 161.562, "r_x1": 406.88, "r_y1": 161.562, "r_x2": 406.88, "r_y2": 150.27300000000002, "r_x3": 394.981, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "R.:", "orig": "R.:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.291, "r_y0": 161.562, "r_x1": 480.594, "r_y1": 161.562, "r_x2": 480.594, "r_y2": 150.27300000000002, "r_x3": 411.291, "r_y3": 150.27300000000002, "coord_origin": "TOPLEFT"}, "text": "Pingan-vcgroup's", "orig": "Pingan-vcgroup's", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 172.52099999999996, "r_x1": 183.303, "r_y1": 172.52099999999996, "r_x2": 183.303, "r_y2": 161.23199999999997, "r_x3": 151.518, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "solution", "orig": "solution", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.948, "r_y0": 172.52099999999996, "r_x1": 198.974, "r_y1": 172.52099999999996, "r_x2": 198.974, "r_y2": 161.23199999999997, "r_x3": 187.948, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.618, "r_y0": 172.52099999999996, "r_x1": 223.601, "r_y1": 172.52099999999996, "r_x2": 223.601, "r_y2": 161.23199999999997, "r_x3": 203.618, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "icdar", "orig": "icdar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.245, "r_y0": 172.52099999999996, "r_x1": 246.664, "r_y1": 172.52099999999996, "r_x2": 246.664, "r_y2": 161.23199999999997, "r_x3": 228.245, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "2021", "orig": "2021", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.309, "r_y0": 172.52099999999996, "r_x1": 299.174, "r_y1": 172.52099999999996, "r_x2": 299.174, "r_y2": 161.23199999999997, "r_x3": 251.309, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "competition", "orig": "competition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 303.819, "r_y0": 172.52099999999996, "r_x1": 352.788, "r_y1": 172.52099999999996, "r_x2": 352.788, "r_y2": 161.23199999999997, "r_x3": 303.819, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "on scientific", "orig": "on scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.432, "r_y0": 172.52099999999996, "r_x1": 394.845, "r_y1": 172.52099999999996, "r_x2": 394.845, "r_y2": 161.23199999999997, "r_x3": 357.432, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "literature", "orig": "literature", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.49, "r_y0": 172.52099999999996, "r_x1": 428.737, "r_y1": 172.52099999999996, "r_x2": 428.737, "r_y2": 161.23199999999997, "r_x3": 399.49, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "parsing", "orig": "parsing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 433.381, "r_y0": 172.52099999999996, "r_x1": 450.068, "r_y1": 172.52099999999996, "r_x2": 450.068, "r_y2": 161.23199999999997, "r_x3": 433.381, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "task", "orig": "task", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.703, "r_y0": 172.52099999999996, "r_x1": 462.38, "r_y1": 172.52099999999996, "r_x2": 462.38, "r_y2": 161.23199999999997, "r_x3": 454.703, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "b:", "orig": "b:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.025, "r_y0": 172.52099999999996, "r_x1": 480.595, "r_y1": 172.52099999999996, "r_x2": 480.595, "r_y2": 161.23199999999997, "r_x3": 467.025, "r_y3": 161.23199999999997, "coord_origin": "TOPLEFT"}, "text": "Ta-", "orig": "Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 183.48000000000002, "r_x1": 163.294, "r_y1": 183.48000000000002, "r_x2": 163.294, "r_y2": 172.19100000000003, "r_x3": 151.518, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "ble", "orig": "ble", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.732, "r_y0": 183.48000000000002, "r_x1": 212.287, "r_y1": 183.48000000000002, "r_x2": 212.287, "r_y2": 172.19100000000003, "r_x3": 167.732, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "recognition", "orig": "recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.734, "r_y0": 183.48000000000002, "r_x1": 224.924, "r_y1": 183.48000000000002, "r_x2": 224.924, "r_y2": 172.19100000000003, "r_x3": 216.734, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.362, "r_y0": 183.48000000000002, "r_x1": 280.64, "r_y1": 183.48000000000002, "r_x2": 280.64, "r_y2": 172.19100000000003, "r_x3": 229.362, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": "html (2021).", "orig": "html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.078, "r_y0": 182.58399999999995, "r_x1": 478.034, "r_y1": 182.58399999999995, "r_x2": 478.034, "r_y2": 175.115, "r_x3": 285.078, "r_y3": 175.115, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.032, "r_y0": 183.48000000000002, "r_x1": 480.591, "r_y1": 183.48000000000002, "r_x2": 480.591, "r_y2": 172.19100000000003, "r_x3": 478.032, "r_y3": 172.19100000000003, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 193.543, "r_x1": 302.116, "r_y1": 193.543, "r_x2": 302.116, "r_y2": 186.07399999999996, "r_x3": 151.518, "r_y3": 186.07399999999996, "coord_origin": "TOPLEFT"}, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "19. Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup's solution for icdar 2021 competition on scientific literature parsing task b: Table recognition to html (2021). https://doi.org/10.48550/ARXIV.2105.01848 , https://arxiv.org/abs/2105.01848"}, {"label": "list_item", "id": 4, "page_no": 13, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 134.765, "t": 194.10900000000004, "r": 480.594, "b": 216.356, "coord_origin": "TOPLEFT"}, "confidence": 0.9531471729278564, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 205.39800000000002, "r_x1": 146.538, "r_y1": 205.39800000000002, "r_x2": 146.538, "r_y2": 194.10900000000004, "r_x3": 134.765, "r_y3": 194.10900000000004, "coord_origin": "TOPLEFT"}, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 205.39800000000002, "r_x1": 480.594, "r_y1": 205.39800000000002, "r_x2": 480.594, "r_y2": 194.10900000000004, "r_x3": 151.514, "r_y3": 194.10900000000004, "coord_origin": "TOPLEFT"}, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 216.356, "r_x1": 318.551, "r_y1": 216.356, "r_x2": 318.551, "r_y2": 205.067, "r_x3": 151.518, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.621, "r_y0": 215.20799999999997, "r_x1": 337.532, "r_y1": 215.20799999999997, "r_x2": 337.532, "r_y2": 207.28200000000004, "r_x3": 321.621, "r_y3": 207.28200000000004, "coord_origin": "TOPLEFT"}, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.533, "r_y0": 216.356, "r_x1": 340.092, "r_y1": 216.356, "r_x2": 340.092, "r_y2": 205.067, "r_x3": 337.533, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.159, "r_y0": 216.356, "r_x1": 399.469, "r_y1": 216.356, "r_x2": 399.469, "r_y2": 205.067, "r_x3": 343.159, "r_y3": 205.067, "coord_origin": "TOPLEFT"}, "text": "108565 (2022)", "orig": "108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "20. Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table structure recognizer. Pattern Recognition 126 , 108565 (2022)"}, {"label": "list_item", "id": 0, "page_no": 13, "cluster": {"id": 0, "label": "list_item", "bbox": {"l": 134.765, "t": 216.02599999999995, "r": 480.593, "b": 270.255, "coord_origin": "TOPLEFT"}, "confidence": 0.972027063369751, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 227.31500000000005, "r_x1": 146.538, "r_y1": 227.31500000000005, "r_x2": 146.538, "r_y2": 216.02599999999995, "r_x3": 134.765, "r_y3": 216.02599999999995, "coord_origin": "TOPLEFT"}, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 227.31500000000005, "r_x1": 480.59, "r_y1": 227.31500000000005, "r_x2": 480.59, "r_y2": 216.02599999999995, "r_x3": 151.514, "r_y3": 216.02599999999995, "coord_origin": "TOPLEFT"}, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 238.274, "r_x1": 480.591, "r_y1": 238.274, "r_x2": 480.591, "r_y2": 226.985, "r_x3": 151.518, "r_y3": 226.985, "coord_origin": "TOPLEFT"}, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 249.23299999999995, "r_x1": 480.591, "r_y1": 249.23299999999995, "r_x2": 480.591, "r_y2": 237.94399999999996, "r_x3": 151.518, "r_y3": 237.94399999999996, "coord_origin": "TOPLEFT"}, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 260.192, "r_x1": 293.441, "r_y1": 260.192, "r_x2": 293.441, "r_y2": 248.90300000000002, "r_x3": 151.518, "r_y3": 248.90300000000002, "coord_origin": "TOPLEFT"}, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 297.05, "r_y0": 259.29600000000005, "r_x1": 480.593, "r_y1": 259.29600000000005, "r_x2": 480.593, "r_y2": 251.827, "r_x3": 297.05, "r_y3": 251.827, "coord_origin": "TOPLEFT"}, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 270.255, "r_x1": 175.05, "r_y1": 270.255, "r_x2": 175.05, "r_y2": 262.78599999999994, "r_x3": 151.518, "r_y3": 262.78599999999994, "coord_origin": "TOPLEFT"}, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "21. Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vision (WACV). pp. 697-706 (2021). https://doi.org/10.1109/WACV48630.2021. 00074"}, {"label": "list_item", "id": 1, "page_no": 13, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 134.765, "t": 270.821, "r": 480.596, "b": 314.987, "coord_origin": "TOPLEFT"}, "confidence": 0.9685125946998596, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 282.11, "r_x1": 146.538, "r_y1": 282.11, "r_x2": 146.538, "r_y2": 270.821, "r_x3": 134.765, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 282.11, "r_x1": 271.779, "r_y1": 282.11, "r_x2": 271.779, "r_y2": 270.821, "r_x3": 151.514, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "Zhong, X., ShafieiBavani, E.,", "orig": "Zhong, X., ShafieiBavani, E.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 275.957, "r_y0": 282.11, "r_x1": 480.591, "r_y1": 282.11, "r_x2": 480.591, "r_y2": 270.821, "r_x3": 275.957, "r_y3": 270.821, "coord_origin": "TOPLEFT"}, "text": "Jimeno Yepes, A.: Image-based table recognition:", "orig": "Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 293.069, "r_x1": 480.588, "r_y1": 293.069, "r_x2": 480.588, "r_y2": 281.78, "r_x3": 151.518, "r_y3": 281.78, "coord_origin": "TOPLEFT"}, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 304.028, "r_x1": 480.596, "r_y1": 304.028, "r_x2": 480.596, "r_y2": 292.739, "r_x3": 151.518, "r_y3": 292.739, "coord_origin": "TOPLEFT"}, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 314.987, "r_x1": 236.024, "r_y1": 314.987, "r_x2": 236.024, "r_y2": 303.698, "r_x3": 151.518, "r_y3": 303.698, "coord_origin": "TOPLEFT"}, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "22. Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition: Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M. (eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Publishing, Cham (2020)"}, {"label": "list_item", "id": 2, "page_no": 13, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 134.765, "t": 314.657, "r": 480.595, "b": 347.863, "coord_origin": "TOPLEFT"}, "confidence": 0.9668973684310913, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 325.946, "r_x1": 146.538, "r_y1": 325.946, "r_x2": 146.538, "r_y2": 314.657, "r_x3": 134.765, "r_y3": 314.657, "coord_origin": "TOPLEFT"}, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.514, "r_y0": 325.946, "r_x1": 480.595, "r_y1": 325.946, "r_x2": 480.595, "r_y2": 314.657, "r_x3": 151.514, "r_y3": 314.657, "coord_origin": "TOPLEFT"}, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 336.904, "r_x1": 480.594, "r_y1": 336.904, "r_x2": 480.594, "r_y2": 325.615, "r_x3": 151.518, "r_y3": 325.615, "coord_origin": "TOPLEFT"}, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.518, "r_y0": 347.863, "r_x1": 335.136, "r_y1": 347.863, "r_x2": 335.136, "r_y2": 336.574, "r_x3": 151.518, "r_y3": 336.574, "coord_origin": "TOPLEFT"}, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "23. Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document layout analysis. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1015-1022. IEEE (2019)"}], "headers": [{"label": "page_header", "id": 7, "page_no": 13, "cluster": {"id": 7, "label": "page_header", "bbox": {"l": 134.765, "t": 91.49300000000005, "r": 143.979, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.7012730240821838, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.765, "r_y0": 102.78200000000004, "r_x1": 143.979, "r_y1": 102.78200000000004, "r_x2": 143.979, "r_y2": 91.49300000000005, "r_x3": 134.765, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "14"}, {"label": "page_header", "id": 6, "page_no": 13, "cluster": {"id": 6, "label": "page_header", "bbox": {"l": 167.821, "t": 91.49300000000005, "r": 231.72, "b": 102.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.7889755964279175, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.821, "r_y0": 102.78200000000004, "r_x1": 231.72, "r_y1": 102.78200000000004, "r_x2": 231.72, "r_y2": 91.49300000000005, "r_x3": 167.821, "r_y3": 91.49300000000005, "coord_origin": "TOPLEFT"}, "text": "M. Lysak, et al.", "orig": "M. Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "M. Lysak, et al."}]}}]