[ { "page_no": 0, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 128.58, "r_x1": 480.6, "r_y1": 128.58, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 134.76, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.67, "r_y0": 146.51, "r_x1": 348.69, "r_y1": 146.51, "r_x2": 348.69, "r_y2": 133.83, "r_x3": 266.67, "r_y3": 133.83, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.23, "r_y0": 180.47, "r_x1": 217.04, "r_y1": 180.47, "r_x2": 217.04, "r_y2": 171.67, "r_x3": 151.23, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.05, "r_y0": 176.27, "r_x1": 235.19, "r_y1": 176.27, "r_x2": 235.19, "r_y2": 170.08, "r_x3": 217.05, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.19, "r_y0": 176.27, "r_x1": 241.41, "r_y1": 176.27, "r_x2": 241.41, "r_y2": 169.69, "r_x3": 235.19, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41, "r_y0": 176.27, "r_x1": 257.3, "r_y1": 176.27, "r_x2": 257.3, "r_y2": 170.08, "r_x3": 241.41, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.27, "r_x1": 263.52, "r_y1": 176.27, "r_x2": 263.52, "r_y2": 169.69, "r_x3": 257.3, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52, "r_y0": 176.27, "r_x1": 279.41, "r_y1": 176.27, "r_x2": 279.41, "r_y2": 170.08, "r_x3": 263.52, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27, "r_x1": 285.64, "r_y1": 176.27, "r_x2": 285.64, "r_y2": 169.69, "r_x3": 279.41, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 180.47, "r_x1": 392.28, "r_y1": 180.47, "r_x2": 392.28, "r_y2": 171.67, "r_x3": 285.64, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.28, "r_y0": 176.27, "r_x1": 398.5, "r_y1": 176.27, "r_x2": 398.5, "r_y2": 169.69, "r_x3": 392.28, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.27, "r_x1": 414.39, "r_y1": 176.27, "r_x2": 414.39, "r_y2": 170.08, "r_x3": 398.5, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.39, "r_y0": 176.27, "r_x1": 420.61, "r_y1": 176.27, "r_x2": 420.61, "r_y2": 169.69, "r_x3": 414.39, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61, "r_y0": 176.27, "r_x1": 436.5, "r_y1": 176.27, "r_x2": 436.5, "r_y2": 170.08, "r_x3": 420.61, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.27, "r_x1": 442.72, "r_y1": 176.27, "r_x2": 442.72, "r_y2": 169.69, "r_x3": 436.5, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.73, "r_y0": 180.47, "r_x1": 464.13, "r_y1": 180.47, "r_x2": 464.13, "r_y2": 171.67, "r_x3": 442.73, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34, "r_y0": 192.43, "r_x1": 224.81, "r_y1": 192.43, "r_x2": 224.81, "r_y2": 183.63, "r_x3": 139.34, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.81, "r_y0": 188.23, "r_x1": 242.95, "r_y1": 188.23, "r_x2": 242.95, "r_y2": 182.04, "r_x3": 224.81, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.95, "r_y0": 188.23, "r_x1": 249.17, "r_y1": 188.23, "r_x2": 249.17, "r_y2": 181.65, "r_x3": 242.95, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17, "r_y0": 188.23, "r_x1": 265.06, "r_y1": 188.23, "r_x2": 265.06, "r_y2": 182.04, "r_x3": 249.17, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.06, "r_y0": 188.23, "r_x1": 271.29, "r_y1": 188.23, "r_x2": 271.29, "r_y2": 181.65, "r_x3": 265.06, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.29, "r_y0": 188.23, "r_x1": 287.17, "r_y1": 188.23, "r_x2": 287.17, "r_y2": 182.04, "r_x3": 271.29, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17, "r_y0": 188.23, "r_x1": 293.4, "r_y1": 188.23, "r_x2": 293.4, "r_y2": 181.65, "r_x3": 287.17, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.43, "r_x1": 404.16, "r_y1": 192.43, "r_x2": 404.16, "r_y2": 183.63, "r_x3": 293.4, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.16, "r_y0": 188.23, "r_x1": 410.38, "r_y1": 188.23, "r_x2": 410.38, "r_y2": 181.65, "r_x3": 404.16, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.39, "r_y0": 188.23, "r_x1": 426.27, "r_y1": 188.23, "r_x2": 426.27, "r_y2": 182.04, "r_x3": 410.39, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27, "r_y0": 188.23, "r_x1": 432.5, "r_y1": 188.23, "r_x2": 432.5, "r_y2": 181.65, "r_x3": 426.27, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.23, "r_x1": 448.38, "r_y1": 188.23, "r_x2": 448.38, "r_y2": 182.04, "r_x3": 432.5, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.38, "r_y0": 188.23, "r_x1": 454.61, "r_y1": 188.23, "r_x2": 454.61, "r_y2": 181.65, "r_x3": 448.38, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.61, "r_y0": 192.43, "r_x1": 476.01, "r_y1": 192.43, "r_x2": 476.01, "r_y2": 183.63, "r_x3": 454.61, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52, "r_y0": 204.38, "r_x1": 298.61, "r_y1": 204.38, "r_x2": 298.61, "r_y2": 195.58, "r_x3": 229.52, "r_y3": 195.58, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.61, "r_y0": 200.19, "r_x1": 316.75, "r_y1": 200.19, "r_x2": 316.75, "r_y2": 193.99, "r_x3": 298.61, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.75, "r_y0": 200.19, "r_x1": 322.97, "r_y1": 200.19, "r_x2": 322.97, "r_y2": 193.6, "r_x3": 316.75, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97, "r_y0": 200.19, "r_x1": 338.86, "r_y1": 200.19, "r_x2": 338.86, "r_y2": 193.99, "r_x3": 322.97, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.86, "r_y0": 200.19, "r_x1": 345.08, "r_y1": 200.19, "r_x2": 345.08, "r_y2": 193.6, "r_x3": 338.86, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.09, "r_y0": 200.19, "r_x1": 360.97, "r_y1": 200.19, "r_x2": 360.97, "r_y2": 193.99, "r_x3": 345.09, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97, "r_y0": 200.19, "r_x1": 367.2, "r_y1": 200.19, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 360.97, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.19, "r_x1": 385.34, "r_y1": 200.19, "r_x2": 385.34, "r_y2": 193.99, "r_x3": 367.2, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.11, "r_y0": 225.27, "r_x1": 336.25, "r_y1": 225.27, "r_x2": 336.25, "r_y2": 217.2, "r_x3": 279.11, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.97, "r_y0": 236.28, "r_x1": 392.39, "r_y1": 236.28, "r_x2": 392.39, "r_y2": 228.81, "r_x3": 222.97, "r_y3": 228.81, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 278.23, "r_x1": 206.64, "r_y1": 278.23, "r_x2": 206.64, "r_y2": 270.3, "r_x3": 163.11, "r_y3": 270.3, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.62, "r_y0": 278.43, "r_x1": 452.24, "r_y1": 278.43, "r_x2": 452.24, "r_y2": 270.36, "r_x3": 211.62, "r_y3": 270.36, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 289.39, "r_x1": 452.24, "r_y1": 289.39, "r_x2": 452.24, "r_y2": 281.32, "r_x3": 163.11, "r_y3": 281.32, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 300.35, "r_x1": 452.25, "r_y1": 300.35, "r_x2": 452.25, "r_y2": 292.28, "r_x3": 163.11, "r_y3": 292.28, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 311.31, "r_x1": 452.24, "r_y1": 311.31, "r_x2": 452.24, "r_y2": 303.24, "r_x3": 163.11, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 322.27, "r_x1": 452.25, "r_y1": 322.27, "r_x2": 452.25, "r_y2": 314.2, "r_x3": 163.11, "r_y3": 314.2, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 333.23, "r_x1": 452.25, "r_y1": 333.23, "r_x2": 452.25, "r_y2": 325.16, "r_x3": 163.11, "r_y3": 325.16, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 344.19, "r_x1": 452.25, "r_y1": 344.19, "r_x2": 452.25, "r_y2": 336.12, "r_x3": 163.11, "r_y3": 336.12, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 355.15, "r_x1": 452.25, "r_y1": 355.15, "r_x2": 452.25, "r_y2": 347.08, "r_x3": 163.11, "r_y3": 347.08, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 366.1, "r_x1": 452.25, "r_y1": 366.1, "r_x2": 452.25, "r_y2": 358.03, "r_x3": 163.11, "r_y3": 358.03, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 377.06, "r_x1": 452.25, "r_y1": 377.06, "r_x2": 452.25, "r_y2": 368.99, "r_x3": 163.11, "r_y3": 368.99, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 388.02, "r_x1": 452.24, "r_y1": 388.02, "r_x2": 452.24, "r_y2": 379.95, "r_x3": 163.11, "r_y3": 379.95, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 398.98, "r_x1": 452.24, "r_y1": 398.98, "r_x2": 452.24, "r_y2": 390.91, "r_x3": 163.11, "r_y3": 390.91, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 409.94, "r_x1": 452.25, "r_y1": 409.94, "r_x2": 452.25, "r_y2": 401.87, "r_x3": 163.11, "r_y3": 401.87, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 420.9, "r_x1": 452.24, "r_y1": 420.9, "r_x2": 452.24, "r_y2": 412.83, "r_x3": 163.11, "r_y3": 412.83, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 431.86, "r_x1": 452.24, "r_y1": 431.86, "r_x2": 452.24, "r_y2": 423.79, "r_x3": 163.11, "r_y3": 423.79, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 442.82, "r_x1": 452.24, "r_y1": 442.82, "r_x2": 452.24, "r_y2": 434.75, "r_x3": 163.11, "r_y3": 434.75, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 453.78, "r_x1": 452.25, "r_y1": 453.78, "r_x2": 452.25, "r_y2": 445.71, "r_x3": 163.11, "r_y3": 445.71, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 464.73, "r_x1": 225.56, "r_y1": 464.73, "r_x2": 225.56, "r_y2": 456.66, "r_x3": 163.11, "r_y3": 456.66, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 486.62, "r_x1": 211.94, "r_y1": 486.62, "r_x2": 211.94, "r_y2": 478.69, "r_x3": 163.11, "r_y3": 478.69, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.55, "r_y0": 486.83, "r_x1": 452.24, "r_y1": 486.83, "r_x2": 452.24, "r_y2": 478.76, "r_x3": 216.55, "r_y3": 478.76, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 497.79, "r_x1": 257.64, "r_y1": 497.79, "r_x2": 257.64, "r_y2": 489.72, "r_x3": 163.11, "r_y3": 489.72, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 532.69, "r_x1": 141.49, "r_y1": 532.69, "r_x2": 141.49, "r_y2": 522.12, "r_x3": 134.77, "r_y3": 522.12, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 532.69, "r_x1": 228.93, "r_y1": 532.69, "r_x2": 228.93, "r_y2": 522.12, "r_x3": 154.94, "r_y3": 522.12, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 557.08, "r_x1": 480.59, "r_y1": 557.08, "r_x2": 480.59, "r_y2": 548.29, "r_x3": 134.77, "r_y3": 548.29, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 569.04, "r_x1": 480.59, "r_y1": 569.04, "r_x2": 480.59, "r_y2": 560.24, "r_x3": 134.77, "r_y3": 560.24, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 580.99, "r_x1": 480.59, "r_y1": 580.99, "r_x2": 480.59, "r_y2": 572.2, "r_x3": 134.77, "r_y3": 572.2, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 592.95, "r_x1": 480.6, "r_y1": 592.95, "r_x2": 480.6, "r_y2": 584.15, "r_x3": 134.77, "r_y3": 584.15, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 604.9, "r_x1": 480.59, "r_y1": 604.9, "r_x2": 480.59, "r_y2": 596.11, "r_x3": 134.77, "r_y3": 596.11, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 616.86, "r_x1": 480.59, "r_y1": 616.86, "r_x2": 480.59, "r_y2": 608.06, "r_x3": 134.77, "r_y3": 608.06, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.81, "r_x1": 279.33, "r_y1": 628.81, "r_x2": 279.33, "r_y2": 620.02, "r_x3": 134.77, "r_y3": 620.02, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 149.71, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.34, "r_y0": 555.0, "r_x1": 36.34, "r_y1": 555.0, "r_x2": 36.34, "r_y2": 209.48, "r_x3": 18.34, "r_y3": 209.48, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "section_header", "bbox": { "l": 134.76, "t": 115.9, "r": 480.6, "b": 146.51, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 128.58, "r_x1": 480.6, "r_y1": 128.58, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 134.76, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.67, "r_y0": 146.51, "r_x1": 348.69, "r_y1": 146.51, "r_x2": 348.69, "r_y2": 133.83, "r_x3": 266.67, "r_y3": 133.83, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "key_value_region", "bbox": { "l": 139.34, "t": 169.69, "r": 476.01, "b": 236.28, "coord_origin": "TOPLEFT" }, "confidence": 0.484, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.23, "r_y0": 180.47, "r_x1": 217.04, "r_y1": 180.47, "r_x2": 217.04, "r_y2": 171.67, "r_x3": 151.23, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.05, "r_y0": 176.27, "r_x1": 235.19, "r_y1": 176.27, "r_x2": 235.19, "r_y2": 170.08, "r_x3": 217.05, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.19, "r_y0": 176.27, "r_x1": 241.41, "r_y1": 176.27, "r_x2": 241.41, "r_y2": 169.69, "r_x3": 235.19, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41, "r_y0": 176.27, "r_x1": 257.3, "r_y1": 176.27, "r_x2": 257.3, "r_y2": 170.08, "r_x3": 241.41, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.27, "r_x1": 263.52, "r_y1": 176.27, "r_x2": 263.52, "r_y2": 169.69, "r_x3": 257.3, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52, "r_y0": 176.27, "r_x1": 279.41, "r_y1": 176.27, "r_x2": 279.41, "r_y2": 170.08, "r_x3": 263.52, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27, "r_x1": 285.64, "r_y1": 176.27, "r_x2": 285.64, "r_y2": 169.69, "r_x3": 279.41, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 180.47, "r_x1": 392.28, "r_y1": 180.47, "r_x2": 392.28, "r_y2": 171.67, "r_x3": 285.64, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.28, "r_y0": 176.27, "r_x1": 398.5, "r_y1": 176.27, "r_x2": 398.5, "r_y2": 169.69, "r_x3": 392.28, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.27, "r_x1": 414.39, "r_y1": 176.27, "r_x2": 414.39, "r_y2": 170.08, "r_x3": 398.5, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.39, "r_y0": 176.27, "r_x1": 420.61, "r_y1": 176.27, "r_x2": 420.61, "r_y2": 169.69, "r_x3": 414.39, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61, "r_y0": 176.27, "r_x1": 436.5, "r_y1": 176.27, "r_x2": 436.5, "r_y2": 170.08, "r_x3": 420.61, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.27, "r_x1": 442.72, "r_y1": 176.27, "r_x2": 442.72, "r_y2": 169.69, "r_x3": 436.5, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.73, "r_y0": 180.47, "r_x1": 464.13, "r_y1": 180.47, "r_x2": 464.13, "r_y2": 171.67, "r_x3": 442.73, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34, "r_y0": 192.43, "r_x1": 224.81, "r_y1": 192.43, "r_x2": 224.81, "r_y2": 183.63, "r_x3": 139.34, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.81, "r_y0": 188.23, "r_x1": 242.95, "r_y1": 188.23, "r_x2": 242.95, "r_y2": 182.04, "r_x3": 224.81, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.95, "r_y0": 188.23, "r_x1": 249.17, "r_y1": 188.23, "r_x2": 249.17, "r_y2": 181.65, "r_x3": 242.95, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17, "r_y0": 188.23, "r_x1": 265.06, "r_y1": 188.23, "r_x2": 265.06, "r_y2": 182.04, "r_x3": 249.17, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.06, "r_y0": 188.23, "r_x1": 271.29, "r_y1": 188.23, "r_x2": 271.29, "r_y2": 181.65, "r_x3": 265.06, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.29, "r_y0": 188.23, "r_x1": 287.17, "r_y1": 188.23, "r_x2": 287.17, "r_y2": 182.04, "r_x3": 271.29, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17, "r_y0": 188.23, "r_x1": 293.4, "r_y1": 188.23, "r_x2": 293.4, "r_y2": 181.65, "r_x3": 287.17, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.43, "r_x1": 404.16, "r_y1": 192.43, "r_x2": 404.16, "r_y2": 183.63, "r_x3": 293.4, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.16, "r_y0": 188.23, "r_x1": 410.38, "r_y1": 188.23, "r_x2": 410.38, "r_y2": 181.65, "r_x3": 404.16, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.39, "r_y0": 188.23, "r_x1": 426.27, "r_y1": 188.23, "r_x2": 426.27, "r_y2": 182.04, "r_x3": 410.39, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27, "r_y0": 188.23, "r_x1": 432.5, "r_y1": 188.23, "r_x2": 432.5, "r_y2": 181.65, "r_x3": 426.27, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.23, "r_x1": 448.38, "r_y1": 188.23, "r_x2": 448.38, "r_y2": 182.04, "r_x3": 432.5, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.38, "r_y0": 188.23, "r_x1": 454.61, "r_y1": 188.23, "r_x2": 454.61, "r_y2": 181.65, "r_x3": 448.38, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.61, "r_y0": 192.43, "r_x1": 476.01, "r_y1": 192.43, "r_x2": 476.01, "r_y2": 183.63, "r_x3": 454.61, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52, "r_y0": 204.38, "r_x1": 298.61, "r_y1": 204.38, "r_x2": 298.61, "r_y2": 195.58, "r_x3": 229.52, "r_y3": 195.58, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.61, "r_y0": 200.19, "r_x1": 316.75, "r_y1": 200.19, "r_x2": 316.75, "r_y2": 193.99, "r_x3": 298.61, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.75, "r_y0": 200.19, "r_x1": 322.97, "r_y1": 200.19, "r_x2": 322.97, "r_y2": 193.6, "r_x3": 316.75, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97, "r_y0": 200.19, "r_x1": 338.86, "r_y1": 200.19, "r_x2": 338.86, "r_y2": 193.99, "r_x3": 322.97, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.86, "r_y0": 200.19, "r_x1": 345.08, "r_y1": 200.19, "r_x2": 345.08, "r_y2": 193.6, "r_x3": 338.86, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.09, "r_y0": 200.19, "r_x1": 360.97, "r_y1": 200.19, "r_x2": 360.97, "r_y2": 193.99, "r_x3": 345.09, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97, "r_y0": 200.19, "r_x1": 367.2, "r_y1": 200.19, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 360.97, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.19, "r_x1": 385.34, "r_y1": 200.19, "r_x2": 385.34, "r_y2": 193.99, "r_x3": 367.2, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.11, "r_y0": 225.27, "r_x1": 336.25, "r_y1": 225.27, "r_x2": 336.25, "r_y2": 217.2, "r_x3": 279.11, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.97, "r_y0": 236.28, "r_x1": 392.39, "r_y1": 236.28, "r_x2": 392.39, "r_y2": 228.81, "r_x3": 222.97, "r_y3": 228.81, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 139.34, "t": 169.69, "r": 476.01, "b": 200.19, "coord_origin": "TOPLEFT" }, "confidence": 0.792, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.23, "r_y0": 180.47, "r_x1": 217.04, "r_y1": 180.47, "r_x2": 217.04, "r_y2": 171.67, "r_x3": 151.23, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.05, "r_y0": 176.27, "r_x1": 235.19, "r_y1": 176.27, "r_x2": 235.19, "r_y2": 170.08, "r_x3": 217.05, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.19, "r_y0": 176.27, "r_x1": 241.41, "r_y1": 176.27, "r_x2": 241.41, "r_y2": 169.69, "r_x3": 235.19, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41, "r_y0": 176.27, "r_x1": 257.3, "r_y1": 176.27, "r_x2": 257.3, "r_y2": 170.08, "r_x3": 241.41, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.27, "r_x1": 263.52, "r_y1": 176.27, "r_x2": 263.52, "r_y2": 169.69, "r_x3": 257.3, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52, "r_y0": 176.27, "r_x1": 279.41, "r_y1": 176.27, "r_x2": 279.41, "r_y2": 170.08, "r_x3": 263.52, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27, "r_x1": 285.64, "r_y1": 176.27, "r_x2": 285.64, "r_y2": 169.69, "r_x3": 279.41, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 180.47, "r_x1": 392.28, "r_y1": 180.47, "r_x2": 392.28, "r_y2": 171.67, "r_x3": 285.64, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.28, "r_y0": 176.27, "r_x1": 398.5, "r_y1": 176.27, "r_x2": 398.5, "r_y2": 169.69, "r_x3": 392.28, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.27, "r_x1": 414.39, "r_y1": 176.27, "r_x2": 414.39, "r_y2": 170.08, "r_x3": 398.5, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.39, "r_y0": 176.27, "r_x1": 420.61, "r_y1": 176.27, "r_x2": 420.61, "r_y2": 169.69, "r_x3": 414.39, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61, "r_y0": 176.27, "r_x1": 436.5, "r_y1": 176.27, "r_x2": 436.5, "r_y2": 170.08, "r_x3": 420.61, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.27, "r_x1": 442.72, "r_y1": 176.27, "r_x2": 442.72, "r_y2": 169.69, "r_x3": 436.5, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.73, "r_y0": 180.47, "r_x1": 464.13, "r_y1": 180.47, "r_x2": 464.13, "r_y2": 171.67, "r_x3": 442.73, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34, "r_y0": 192.43, "r_x1": 224.81, "r_y1": 192.43, "r_x2": 224.81, "r_y2": 183.63, "r_x3": 139.34, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.81, "r_y0": 188.23, "r_x1": 242.95, "r_y1": 188.23, "r_x2": 242.95, "r_y2": 182.04, "r_x3": 224.81, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.95, "r_y0": 188.23, "r_x1": 249.17, "r_y1": 188.23, "r_x2": 249.17, "r_y2": 181.65, "r_x3": 242.95, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17, "r_y0": 188.23, "r_x1": 265.06, "r_y1": 188.23, "r_x2": 265.06, "r_y2": 182.04, "r_x3": 249.17, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.06, "r_y0": 188.23, "r_x1": 271.29, "r_y1": 188.23, "r_x2": 271.29, "r_y2": 181.65, "r_x3": 265.06, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.29, "r_y0": 188.23, "r_x1": 287.17, "r_y1": 188.23, "r_x2": 287.17, "r_y2": 182.04, "r_x3": 271.29, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17, "r_y0": 188.23, "r_x1": 293.4, "r_y1": 188.23, "r_x2": 293.4, "r_y2": 181.65, "r_x3": 287.17, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.43, "r_x1": 404.16, "r_y1": 192.43, "r_x2": 404.16, "r_y2": 183.63, "r_x3": 293.4, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.16, "r_y0": 188.23, "r_x1": 410.38, "r_y1": 188.23, "r_x2": 410.38, "r_y2": 181.65, "r_x3": 404.16, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.39, "r_y0": 188.23, "r_x1": 426.27, "r_y1": 188.23, "r_x2": 426.27, "r_y2": 182.04, "r_x3": 410.39, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27, "r_y0": 188.23, "r_x1": 432.5, "r_y1": 188.23, "r_x2": 432.5, "r_y2": 181.65, "r_x3": 426.27, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.23, "r_x1": 448.38, "r_y1": 188.23, "r_x2": 448.38, "r_y2": 182.04, "r_x3": 432.5, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.38, "r_y0": 188.23, "r_x1": 454.61, "r_y1": 188.23, "r_x2": 454.61, "r_y2": 181.65, "r_x3": 448.38, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.61, "r_y0": 192.43, "r_x1": 476.01, "r_y1": 192.43, "r_x2": 476.01, "r_y2": 183.63, "r_x3": 454.61, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.61, "r_y0": 200.19, "r_x1": 316.75, "r_y1": 200.19, "r_x2": 316.75, "r_y2": 193.99, "r_x3": 298.61, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.75, "r_y0": 200.19, "r_x1": 322.97, "r_y1": 200.19, "r_x2": 322.97, "r_y2": 193.6, "r_x3": 316.75, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97, "r_y0": 200.19, "r_x1": 338.86, "r_y1": 200.19, "r_x2": 338.86, "r_y2": 193.99, "r_x3": 322.97, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.86, "r_y0": 200.19, "r_x1": 345.08, "r_y1": 200.19, "r_x2": 345.08, "r_y2": 193.6, "r_x3": 338.86, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.09, "r_y0": 200.19, "r_x1": 360.97, "r_y1": 200.19, "r_x2": 360.97, "r_y2": 193.99, "r_x3": 345.09, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97, "r_y0": 200.19, "r_x1": 367.2, "r_y1": 200.19, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 360.97, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.19, "r_x1": 385.34, "r_y1": 200.19, "r_x2": 385.34, "r_y2": 193.99, "r_x3": 367.2, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 229.52, "t": 195.58, "r": 298.61, "b": 204.38, "coord_origin": "TOPLEFT" }, "confidence": 0.502, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52, "r_y0": 204.38, "r_x1": 298.61, "r_y1": 204.38, "r_x2": 298.61, "r_y2": 195.58, "r_x3": 229.52, "r_y3": 195.58, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 279.11, "t": 217.2, "r": 336.25, "b": 225.27, "coord_origin": "TOPLEFT" }, "confidence": 0.631, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.11, "r_y0": 225.27, "r_x1": 336.25, "r_y1": 225.27, "r_x2": 336.25, "r_y2": 217.2, "r_x3": 279.11, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 222.97, "t": 228.81, "r": 392.39, "b": 236.28, "coord_origin": "TOPLEFT" }, "confidence": 0.692, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.97, "r_y0": 236.28, "r_x1": 392.39, "r_y1": 236.28, "r_x2": 392.39, "r_y2": 228.81, "r_x3": 222.97, "r_y3": 228.81, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 1, "label": "text", "bbox": { "l": 163.11, "t": 270.3, "r": 452.25, "b": 464.73, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 278.23, "r_x1": 206.64, "r_y1": 278.23, "r_x2": 206.64, "r_y2": 270.3, "r_x3": 163.11, "r_y3": 270.3, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.62, "r_y0": 278.43, "r_x1": 452.24, "r_y1": 278.43, "r_x2": 452.24, "r_y2": 270.36, "r_x3": 211.62, "r_y3": 270.36, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 289.39, "r_x1": 452.24, "r_y1": 289.39, "r_x2": 452.24, "r_y2": 281.32, "r_x3": 163.11, "r_y3": 281.32, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 300.35, "r_x1": 452.25, "r_y1": 300.35, "r_x2": 452.25, "r_y2": 292.28, "r_x3": 163.11, "r_y3": 292.28, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 311.31, "r_x1": 452.24, "r_y1": 311.31, "r_x2": 452.24, "r_y2": 303.24, "r_x3": 163.11, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 322.27, "r_x1": 452.25, "r_y1": 322.27, "r_x2": 452.25, "r_y2": 314.2, "r_x3": 163.11, "r_y3": 314.2, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 333.23, "r_x1": 452.25, "r_y1": 333.23, "r_x2": 452.25, "r_y2": 325.16, "r_x3": 163.11, "r_y3": 325.16, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 344.19, "r_x1": 452.25, "r_y1": 344.19, "r_x2": 452.25, "r_y2": 336.12, "r_x3": 163.11, "r_y3": 336.12, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 355.15, "r_x1": 452.25, "r_y1": 355.15, "r_x2": 452.25, "r_y2": 347.08, "r_x3": 163.11, "r_y3": 347.08, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 366.1, "r_x1": 452.25, "r_y1": 366.1, "r_x2": 452.25, "r_y2": 358.03, "r_x3": 163.11, "r_y3": 358.03, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 377.06, "r_x1": 452.25, "r_y1": 377.06, "r_x2": 452.25, "r_y2": 368.99, "r_x3": 163.11, "r_y3": 368.99, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 388.02, "r_x1": 452.24, "r_y1": 388.02, "r_x2": 452.24, "r_y2": 379.95, "r_x3": 163.11, "r_y3": 379.95, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 398.98, "r_x1": 452.24, "r_y1": 398.98, "r_x2": 452.24, "r_y2": 390.91, "r_x3": 163.11, "r_y3": 390.91, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 409.94, "r_x1": 452.25, "r_y1": 409.94, "r_x2": 452.25, "r_y2": 401.87, "r_x3": 163.11, "r_y3": 401.87, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 420.9, "r_x1": 452.24, "r_y1": 420.9, "r_x2": 452.24, "r_y2": 412.83, "r_x3": 163.11, "r_y3": 412.83, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 431.86, "r_x1": 452.24, "r_y1": 431.86, "r_x2": 452.24, "r_y2": 423.79, "r_x3": 163.11, "r_y3": 423.79, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 442.82, "r_x1": 452.24, "r_y1": 442.82, "r_x2": 452.24, "r_y2": 434.75, "r_x3": 163.11, "r_y3": 434.75, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 453.78, "r_x1": 452.25, "r_y1": 453.78, "r_x2": 452.25, "r_y2": 445.71, "r_x3": 163.11, "r_y3": 445.71, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 464.73, "r_x1": 225.56, "r_y1": 464.73, "r_x2": 225.56, "r_y2": 456.66, "r_x3": 163.11, "r_y3": 456.66, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 163.11, "t": 478.69, "r": 452.24, "b": 497.79, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 486.62, "r_x1": 211.94, "r_y1": 486.62, "r_x2": 211.94, "r_y2": 478.69, "r_x3": 163.11, "r_y3": 478.69, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.55, "r_y0": 486.83, "r_x1": 452.24, "r_y1": 486.83, "r_x2": 452.24, "r_y2": 478.76, "r_x3": 216.55, "r_y3": 478.76, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 497.79, "r_x1": 257.64, "r_y1": 497.79, "r_x2": 257.64, "r_y2": 489.72, "r_x3": 163.11, "r_y3": 489.72, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.77, "t": 522.12, "r": 228.93, "b": 532.69, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 532.69, "r_x1": 141.49, "r_y1": 532.69, "r_x2": 141.49, "r_y2": 522.12, "r_x3": 134.77, "r_y3": 522.12, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 532.69, "r_x1": 228.93, "r_y1": 532.69, "r_x2": 228.93, "r_y2": 522.12, "r_x3": 154.94, "r_y3": 522.12, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.77, "t": 548.29, "r": 480.6, "b": 628.81, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 557.08, "r_x1": 480.59, "r_y1": 557.08, "r_x2": 480.59, "r_y2": 548.29, "r_x3": 134.77, "r_y3": 548.29, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 569.04, "r_x1": 480.59, "r_y1": 569.04, "r_x2": 480.59, "r_y2": 560.24, "r_x3": 134.77, "r_y3": 560.24, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 580.99, "r_x1": 480.59, "r_y1": 580.99, "r_x2": 480.59, "r_y2": 572.2, "r_x3": 134.77, "r_y3": 572.2, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 592.95, "r_x1": 480.6, "r_y1": 592.95, "r_x2": 480.6, "r_y2": 584.15, "r_x3": 134.77, "r_y3": 584.15, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 604.9, "r_x1": 480.59, "r_y1": 604.9, "r_x2": 480.59, "r_y2": 596.11, "r_x3": 134.77, "r_y3": 596.11, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 616.86, "r_x1": 480.59, "r_y1": 616.86, "r_x2": 480.59, "r_y2": 608.06, "r_x3": 134.77, "r_y3": 608.06, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.81, "r_x1": 279.33, "r_y1": 628.81, "r_x2": 279.33, "r_y2": 620.02, "r_x3": 134.77, "r_y3": 620.02, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.77, "t": 632.15, "r": 480.6, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 149.71, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 18.34, "t": 209.48, "r": 36.34, "b": 555.0, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.34, "r_y0": 555.0, "r_x1": 36.34, "r_y1": 555.0, "r_x2": 36.34, "r_y2": 209.48, "r_x3": 18.34, "r_y3": 209.48, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.76, "t": 115.9, "r": 480.6, "b": 146.51, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 128.58, "r_x1": 480.6, "r_y1": 128.58, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 134.76, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.67, "r_y0": 146.51, "r_x1": 348.69, "r_y1": 146.51, "r_x2": 348.69, "r_y2": 133.83, "r_x3": 266.67, "r_y3": 133.83, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "key_value_region", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "key_value_region", "bbox": { "l": 139.34, "t": 169.69, "r": 476.01, "b": 236.28, "coord_origin": "TOPLEFT" }, "confidence": 0.484, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.23, "r_y0": 180.47, "r_x1": 217.04, "r_y1": 180.47, "r_x2": 217.04, "r_y2": 171.67, "r_x3": 151.23, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.05, "r_y0": 176.27, "r_x1": 235.19, "r_y1": 176.27, "r_x2": 235.19, "r_y2": 170.08, "r_x3": 217.05, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.19, "r_y0": 176.27, "r_x1": 241.41, "r_y1": 176.27, "r_x2": 241.41, "r_y2": 169.69, "r_x3": 235.19, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41, "r_y0": 176.27, "r_x1": 257.3, "r_y1": 176.27, "r_x2": 257.3, "r_y2": 170.08, "r_x3": 241.41, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.27, "r_x1": 263.52, "r_y1": 176.27, "r_x2": 263.52, "r_y2": 169.69, "r_x3": 257.3, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52, "r_y0": 176.27, "r_x1": 279.41, "r_y1": 176.27, "r_x2": 279.41, "r_y2": 170.08, "r_x3": 263.52, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27, "r_x1": 285.64, "r_y1": 176.27, "r_x2": 285.64, "r_y2": 169.69, "r_x3": 279.41, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 180.47, "r_x1": 392.28, "r_y1": 180.47, "r_x2": 392.28, "r_y2": 171.67, "r_x3": 285.64, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.28, "r_y0": 176.27, "r_x1": 398.5, "r_y1": 176.27, "r_x2": 398.5, "r_y2": 169.69, "r_x3": 392.28, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.27, "r_x1": 414.39, "r_y1": 176.27, "r_x2": 414.39, "r_y2": 170.08, "r_x3": 398.5, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.39, "r_y0": 176.27, "r_x1": 420.61, "r_y1": 176.27, "r_x2": 420.61, "r_y2": 169.69, "r_x3": 414.39, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61, "r_y0": 176.27, "r_x1": 436.5, "r_y1": 176.27, "r_x2": 436.5, "r_y2": 170.08, "r_x3": 420.61, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.27, "r_x1": 442.72, "r_y1": 176.27, "r_x2": 442.72, "r_y2": 169.69, "r_x3": 436.5, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.73, "r_y0": 180.47, "r_x1": 464.13, "r_y1": 180.47, "r_x2": 464.13, "r_y2": 171.67, "r_x3": 442.73, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34, "r_y0": 192.43, "r_x1": 224.81, "r_y1": 192.43, "r_x2": 224.81, "r_y2": 183.63, "r_x3": 139.34, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.81, "r_y0": 188.23, "r_x1": 242.95, "r_y1": 188.23, "r_x2": 242.95, "r_y2": 182.04, "r_x3": 224.81, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.95, "r_y0": 188.23, "r_x1": 249.17, "r_y1": 188.23, "r_x2": 249.17, "r_y2": 181.65, "r_x3": 242.95, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17, "r_y0": 188.23, "r_x1": 265.06, "r_y1": 188.23, "r_x2": 265.06, "r_y2": 182.04, "r_x3": 249.17, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.06, "r_y0": 188.23, "r_x1": 271.29, "r_y1": 188.23, "r_x2": 271.29, "r_y2": 181.65, "r_x3": 265.06, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.29, "r_y0": 188.23, "r_x1": 287.17, "r_y1": 188.23, "r_x2": 287.17, "r_y2": 182.04, "r_x3": 271.29, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17, "r_y0": 188.23, "r_x1": 293.4, "r_y1": 188.23, "r_x2": 293.4, "r_y2": 181.65, "r_x3": 287.17, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.43, "r_x1": 404.16, "r_y1": 192.43, "r_x2": 404.16, "r_y2": 183.63, "r_x3": 293.4, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.16, "r_y0": 188.23, "r_x1": 410.38, "r_y1": 188.23, "r_x2": 410.38, "r_y2": 181.65, "r_x3": 404.16, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.39, "r_y0": 188.23, "r_x1": 426.27, "r_y1": 188.23, "r_x2": 426.27, "r_y2": 182.04, "r_x3": 410.39, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27, "r_y0": 188.23, "r_x1": 432.5, "r_y1": 188.23, "r_x2": 432.5, "r_y2": 181.65, "r_x3": 426.27, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.23, "r_x1": 448.38, "r_y1": 188.23, "r_x2": 448.38, "r_y2": 182.04, "r_x3": 432.5, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.38, "r_y0": 188.23, "r_x1": 454.61, "r_y1": 188.23, "r_x2": 454.61, "r_y2": 181.65, "r_x3": 448.38, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.61, "r_y0": 192.43, "r_x1": 476.01, "r_y1": 192.43, "r_x2": 476.01, "r_y2": 183.63, "r_x3": 454.61, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52, "r_y0": 204.38, "r_x1": 298.61, "r_y1": 204.38, "r_x2": 298.61, "r_y2": 195.58, "r_x3": 229.52, "r_y3": 195.58, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.61, "r_y0": 200.19, "r_x1": 316.75, "r_y1": 200.19, "r_x2": 316.75, "r_y2": 193.99, "r_x3": 298.61, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.75, "r_y0": 200.19, "r_x1": 322.97, "r_y1": 200.19, "r_x2": 322.97, "r_y2": 193.6, "r_x3": 316.75, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97, "r_y0": 200.19, "r_x1": 338.86, "r_y1": 200.19, "r_x2": 338.86, "r_y2": 193.99, "r_x3": 322.97, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.86, "r_y0": 200.19, "r_x1": 345.08, "r_y1": 200.19, "r_x2": 345.08, "r_y2": 193.6, "r_x3": 338.86, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.09, "r_y0": 200.19, "r_x1": 360.97, "r_y1": 200.19, "r_x2": 360.97, "r_y2": 193.99, "r_x3": 345.09, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97, "r_y0": 200.19, "r_x1": 367.2, "r_y1": 200.19, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 360.97, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.19, "r_x1": 385.34, "r_y1": 200.19, "r_x2": 385.34, "r_y2": 193.99, "r_x3": 367.2, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.11, "r_y0": 225.27, "r_x1": 336.25, "r_y1": 225.27, "r_x2": 336.25, "r_y2": 217.2, "r_x3": 279.11, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.97, "r_y0": 236.28, "r_x1": 392.39, "r_y1": 236.28, "r_x2": 392.39, "r_y2": 228.81, "r_x3": 222.97, "r_y3": 228.81, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 139.34, "t": 169.69, "r": 476.01, "b": 200.19, "coord_origin": "TOPLEFT" }, "confidence": 0.792, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.23, "r_y0": 180.47, "r_x1": 217.04, "r_y1": 180.47, "r_x2": 217.04, "r_y2": 171.67, "r_x3": 151.23, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.05, "r_y0": 176.27, "r_x1": 235.19, "r_y1": 176.27, "r_x2": 235.19, "r_y2": 170.08, "r_x3": 217.05, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.19, "r_y0": 176.27, "r_x1": 241.41, "r_y1": 176.27, "r_x2": 241.41, "r_y2": 169.69, "r_x3": 235.19, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41, "r_y0": 176.27, "r_x1": 257.3, "r_y1": 176.27, "r_x2": 257.3, "r_y2": 170.08, "r_x3": 241.41, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.27, "r_x1": 263.52, "r_y1": 176.27, "r_x2": 263.52, "r_y2": 169.69, "r_x3": 257.3, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52, "r_y0": 176.27, "r_x1": 279.41, "r_y1": 176.27, "r_x2": 279.41, "r_y2": 170.08, "r_x3": 263.52, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27, "r_x1": 285.64, "r_y1": 176.27, "r_x2": 285.64, "r_y2": 169.69, "r_x3": 279.41, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 180.47, "r_x1": 392.28, "r_y1": 180.47, "r_x2": 392.28, "r_y2": 171.67, "r_x3": 285.64, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.28, "r_y0": 176.27, "r_x1": 398.5, "r_y1": 176.27, "r_x2": 398.5, "r_y2": 169.69, "r_x3": 392.28, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.27, "r_x1": 414.39, "r_y1": 176.27, "r_x2": 414.39, "r_y2": 170.08, "r_x3": 398.5, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.39, "r_y0": 176.27, "r_x1": 420.61, "r_y1": 176.27, "r_x2": 420.61, "r_y2": 169.69, "r_x3": 414.39, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61, "r_y0": 176.27, "r_x1": 436.5, "r_y1": 176.27, "r_x2": 436.5, "r_y2": 170.08, "r_x3": 420.61, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.27, "r_x1": 442.72, "r_y1": 176.27, "r_x2": 442.72, "r_y2": 169.69, "r_x3": 436.5, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.73, "r_y0": 180.47, "r_x1": 464.13, "r_y1": 180.47, "r_x2": 464.13, "r_y2": 171.67, "r_x3": 442.73, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34, "r_y0": 192.43, "r_x1": 224.81, "r_y1": 192.43, "r_x2": 224.81, "r_y2": 183.63, "r_x3": 139.34, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.81, "r_y0": 188.23, "r_x1": 242.95, "r_y1": 188.23, "r_x2": 242.95, "r_y2": 182.04, "r_x3": 224.81, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.95, "r_y0": 188.23, "r_x1": 249.17, "r_y1": 188.23, "r_x2": 249.17, "r_y2": 181.65, "r_x3": 242.95, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17, "r_y0": 188.23, "r_x1": 265.06, "r_y1": 188.23, "r_x2": 265.06, "r_y2": 182.04, "r_x3": 249.17, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.06, "r_y0": 188.23, "r_x1": 271.29, "r_y1": 188.23, "r_x2": 271.29, "r_y2": 181.65, "r_x3": 265.06, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.29, "r_y0": 188.23, "r_x1": 287.17, "r_y1": 188.23, "r_x2": 287.17, "r_y2": 182.04, "r_x3": 271.29, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17, "r_y0": 188.23, "r_x1": 293.4, "r_y1": 188.23, "r_x2": 293.4, "r_y2": 181.65, "r_x3": 287.17, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.43, "r_x1": 404.16, "r_y1": 192.43, "r_x2": 404.16, "r_y2": 183.63, "r_x3": 293.4, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.16, "r_y0": 188.23, "r_x1": 410.38, "r_y1": 188.23, "r_x2": 410.38, "r_y2": 181.65, "r_x3": 404.16, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.39, "r_y0": 188.23, "r_x1": 426.27, "r_y1": 188.23, "r_x2": 426.27, "r_y2": 182.04, "r_x3": 410.39, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27, "r_y0": 188.23, "r_x1": 432.5, "r_y1": 188.23, "r_x2": 432.5, "r_y2": 181.65, "r_x3": 426.27, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.23, "r_x1": 448.38, "r_y1": 188.23, "r_x2": 448.38, "r_y2": 182.04, "r_x3": 432.5, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.38, "r_y0": 188.23, "r_x1": 454.61, "r_y1": 188.23, "r_x2": 454.61, "r_y2": 181.65, "r_x3": 448.38, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.61, "r_y0": 192.43, "r_x1": 476.01, "r_y1": 192.43, "r_x2": 476.01, "r_y2": 183.63, "r_x3": 454.61, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.61, "r_y0": 200.19, "r_x1": 316.75, "r_y1": 200.19, "r_x2": 316.75, "r_y2": 193.99, "r_x3": 298.61, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.75, "r_y0": 200.19, "r_x1": 322.97, "r_y1": 200.19, "r_x2": 322.97, "r_y2": 193.6, "r_x3": 316.75, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97, "r_y0": 200.19, "r_x1": 338.86, "r_y1": 200.19, "r_x2": 338.86, "r_y2": 193.99, "r_x3": 322.97, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.86, "r_y0": 200.19, "r_x1": 345.08, "r_y1": 200.19, "r_x2": 345.08, "r_y2": 193.6, "r_x3": 338.86, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.09, "r_y0": 200.19, "r_x1": 360.97, "r_y1": 200.19, "r_x2": 360.97, "r_y2": 193.99, "r_x3": 345.09, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97, "r_y0": 200.19, "r_x1": 367.2, "r_y1": 200.19, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 360.97, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.19, "r_x1": 385.34, "r_y1": 200.19, "r_x2": 385.34, "r_y2": 193.99, "r_x3": 367.2, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 229.52, "t": 195.58, "r": 298.61, "b": 204.38, "coord_origin": "TOPLEFT" }, "confidence": 0.502, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52, "r_y0": 204.38, "r_x1": 298.61, "r_y1": 204.38, "r_x2": 298.61, "r_y2": 195.58, "r_x3": 229.52, "r_y3": 195.58, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 279.11, "t": 217.2, "r": 336.25, "b": 225.27, "coord_origin": "TOPLEFT" }, "confidence": 0.631, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.11, "r_y0": 225.27, "r_x1": 336.25, "r_y1": 225.27, "r_x2": 336.25, "r_y2": 217.2, "r_x3": 279.11, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 222.97, "t": 228.81, "r": 392.39, "b": 236.28, "coord_origin": "TOPLEFT" }, "confidence": 0.692, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.97, "r_y0": 236.28, "r_x1": 392.39, "r_y1": 236.28, "r_x2": 392.39, "r_y2": 228.81, "r_x3": 222.97, "r_y3": 228.81, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 163.11, "t": 270.3, "r": 452.25, "b": 464.73, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 278.23, "r_x1": 206.64, "r_y1": 278.23, "r_x2": 206.64, "r_y2": 270.3, "r_x3": 163.11, "r_y3": 270.3, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.62, "r_y0": 278.43, "r_x1": 452.24, "r_y1": 278.43, "r_x2": 452.24, "r_y2": 270.36, "r_x3": 211.62, "r_y3": 270.36, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 289.39, "r_x1": 452.24, "r_y1": 289.39, "r_x2": 452.24, "r_y2": 281.32, "r_x3": 163.11, "r_y3": 281.32, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 300.35, "r_x1": 452.25, "r_y1": 300.35, "r_x2": 452.25, "r_y2": 292.28, "r_x3": 163.11, "r_y3": 292.28, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 311.31, "r_x1": 452.24, "r_y1": 311.31, "r_x2": 452.24, "r_y2": 303.24, "r_x3": 163.11, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 322.27, "r_x1": 452.25, "r_y1": 322.27, "r_x2": 452.25, "r_y2": 314.2, "r_x3": 163.11, "r_y3": 314.2, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 333.23, "r_x1": 452.25, "r_y1": 333.23, "r_x2": 452.25, "r_y2": 325.16, "r_x3": 163.11, "r_y3": 325.16, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 344.19, "r_x1": 452.25, "r_y1": 344.19, "r_x2": 452.25, "r_y2": 336.12, "r_x3": 163.11, "r_y3": 336.12, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 355.15, "r_x1": 452.25, "r_y1": 355.15, "r_x2": 452.25, "r_y2": 347.08, "r_x3": 163.11, "r_y3": 347.08, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 366.1, "r_x1": 452.25, "r_y1": 366.1, "r_x2": 452.25, "r_y2": 358.03, "r_x3": 163.11, "r_y3": 358.03, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 377.06, "r_x1": 452.25, "r_y1": 377.06, "r_x2": 452.25, "r_y2": 368.99, "r_x3": 163.11, "r_y3": 368.99, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 388.02, "r_x1": 452.24, "r_y1": 388.02, "r_x2": 452.24, "r_y2": 379.95, "r_x3": 163.11, "r_y3": 379.95, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 398.98, "r_x1": 452.24, "r_y1": 398.98, "r_x2": 452.24, "r_y2": 390.91, "r_x3": 163.11, "r_y3": 390.91, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 409.94, "r_x1": 452.25, "r_y1": 409.94, "r_x2": 452.25, "r_y2": 401.87, "r_x3": 163.11, "r_y3": 401.87, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 420.9, "r_x1": 452.24, "r_y1": 420.9, "r_x2": 452.24, "r_y2": 412.83, "r_x3": 163.11, "r_y3": 412.83, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 431.86, "r_x1": 452.24, "r_y1": 431.86, "r_x2": 452.24, "r_y2": 423.79, "r_x3": 163.11, "r_y3": 423.79, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 442.82, "r_x1": 452.24, "r_y1": 442.82, "r_x2": 452.24, "r_y2": 434.75, "r_x3": 163.11, "r_y3": 434.75, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 453.78, "r_x1": 452.25, "r_y1": 453.78, "r_x2": 452.25, "r_y2": 445.71, "r_x3": 163.11, "r_y3": 445.71, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 464.73, "r_x1": 225.56, "r_y1": 464.73, "r_x2": 225.56, "r_y2": 456.66, "r_x3": 163.11, "r_y3": 456.66, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract. Extracting tables from documents is a crucial task in any document conversion pipeline. Recently, transformer-based models have demonstrated that table-structure can be recognized with impressive accuracy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking only the image of a table, such models predict a sequence of tokens (e.g. in HTML, LaTeX) which represent the structure of the table. Since the token representation of the table structure has a significant impact on the accuracy and run-time performance of any Im2Seq model, we investigate in this paper how table-structure representation can be optimised. We propose a new, optimised table-structure language (OTSL) with a minimized vocabulary and specific rules. The benefits of OTSL are that it reduces the number of tokens to 5 (HTML needs 28+) and shortens the sequence length to half of HTML on average. Consequently, model accuracy improves significantly, inference time is halved compared to HTML-based models, and the predicted table structures are always syntactically correct. This in turn eliminates most post-processing needs. Popular table structure data-sets will be published in OTSL format to the community." }, { "label": "text", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "text", "bbox": { "l": 163.11, "t": 478.69, "r": 452.24, "b": 497.79, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 486.62, "r_x1": 211.94, "r_y1": 486.62, "r_x2": 211.94, "r_y2": 478.69, "r_x3": 163.11, "r_y3": 478.69, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.55, "r_y0": 486.83, "r_x1": 452.24, "r_y1": 486.83, "r_x2": 452.24, "r_y2": 478.76, "r_x3": 216.55, "r_y3": 478.76, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 497.79, "r_x1": 257.64, "r_y1": 497.79, "r_x2": 257.64, "r_y2": 489.72, "r_x3": 163.11, "r_y3": 489.72, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Keywords: Table Structure Recognition \u00b7 Data Representation \u00b7 Transformers \u00b7 Optimization." }, { "label": "section_header", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.77, "t": 522.12, "r": 228.93, "b": 532.69, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 532.69, "r_x1": 141.49, "r_y1": 532.69, "r_x2": 141.49, "r_y2": 522.12, "r_x3": 134.77, "r_y3": 522.12, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 532.69, "r_x1": 228.93, "r_y1": 532.69, "r_x2": 228.93, "r_y2": 522.12, "r_x3": 154.94, "r_y3": 522.12, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1 Introduction" }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.77, "t": 548.29, "r": 480.6, "b": 628.81, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 557.08, "r_x1": 480.59, "r_y1": 557.08, "r_x2": 480.59, "r_y2": 548.29, "r_x3": 134.77, "r_y3": 548.29, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 569.04, "r_x1": 480.59, "r_y1": 569.04, "r_x2": 480.59, "r_y2": 560.24, "r_x3": 134.77, "r_y3": 560.24, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 580.99, "r_x1": 480.59, "r_y1": 580.99, "r_x2": 480.59, "r_y2": 572.2, "r_x3": 134.77, "r_y3": 572.2, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 592.95, "r_x1": 480.6, "r_y1": 592.95, "r_x2": 480.6, "r_y2": 584.15, "r_x3": 134.77, "r_y3": 584.15, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 604.9, "r_x1": 480.59, "r_y1": 604.9, "r_x2": 480.59, "r_y2": 596.11, "r_x3": 134.77, "r_y3": 596.11, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 616.86, "r_x1": 480.59, "r_y1": 616.86, "r_x2": 480.59, "r_y2": 608.06, "r_x3": 134.77, "r_y3": 608.06, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.81, "r_x1": 279.33, "r_y1": 628.81, "r_x2": 279.33, "r_y2": 620.02, "r_x3": 134.77, "r_y3": 620.02, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports, manuals, specification sheets or marketing material. They often encode highly valuable information and therefore need to be extracted with high accuracy. Unfortunately, tables appear in documents in various sizes, styling and structure, making it difficult to recover their correct structure with simple analytical methods. Therefore, accurate table extraction is achieved these days with machine-learning based methods." }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.77, "t": 632.15, "r": 480.6, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 149.71, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In modern document understanding systems [1,15], table extraction is typically a two-step process. Firstly, every table on a page is located with a bounding box, and secondly, their logical row and column structure is recognized. As of" }, { "label": "page_header", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 18.34, "t": 209.48, "r": 36.34, "b": 555.0, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.34, "r_y0": 555.0, "r_x1": 36.34, "r_y1": 555.0, "r_x2": 36.34, "r_y2": 209.48, "r_x3": 18.34, "r_y3": 209.48, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023" } ], "body": [ { "label": "section_header", "id": 5, "page_no": 0, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.76, "t": 115.9, "r": 480.6, "b": 146.51, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 128.58, "r_x1": 480.6, "r_y1": 128.58, "r_x2": 480.6, "r_y2": 115.9, "r_x3": 134.76, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure", "orig": "Optimized Table Tokenization for Table Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 266.67, "r_y0": 146.51, "r_x1": 348.69, "r_y1": 146.51, "r_x2": 348.69, "r_y2": 133.83, "r_x3": 266.67, "r_y3": 133.83, "coord_origin": "TOPLEFT" }, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "key_value_region", "id": 16, "page_no": 0, "cluster": { "id": 16, "label": "key_value_region", "bbox": { "l": 139.34, "t": 169.69, "r": 476.01, "b": 236.28, "coord_origin": "TOPLEFT" }, "confidence": 0.484, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.23, "r_y0": 180.47, "r_x1": 217.04, "r_y1": 180.47, "r_x2": 217.04, "r_y2": 171.67, "r_x3": 151.23, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.05, "r_y0": 176.27, "r_x1": 235.19, "r_y1": 176.27, "r_x2": 235.19, "r_y2": 170.08, "r_x3": 217.05, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.19, "r_y0": 176.27, "r_x1": 241.41, "r_y1": 176.27, "r_x2": 241.41, "r_y2": 169.69, "r_x3": 235.19, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41, "r_y0": 176.27, "r_x1": 257.3, "r_y1": 176.27, "r_x2": 257.3, "r_y2": 170.08, "r_x3": 241.41, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.27, "r_x1": 263.52, "r_y1": 176.27, "r_x2": 263.52, "r_y2": 169.69, "r_x3": 257.3, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52, "r_y0": 176.27, "r_x1": 279.41, "r_y1": 176.27, "r_x2": 279.41, "r_y2": 170.08, "r_x3": 263.52, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27, "r_x1": 285.64, "r_y1": 176.27, "r_x2": 285.64, "r_y2": 169.69, "r_x3": 279.41, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 180.47, "r_x1": 392.28, "r_y1": 180.47, "r_x2": 392.28, "r_y2": 171.67, "r_x3": 285.64, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.28, "r_y0": 176.27, "r_x1": 398.5, "r_y1": 176.27, "r_x2": 398.5, "r_y2": 169.69, "r_x3": 392.28, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.27, "r_x1": 414.39, "r_y1": 176.27, "r_x2": 414.39, "r_y2": 170.08, "r_x3": 398.5, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.39, "r_y0": 176.27, "r_x1": 420.61, "r_y1": 176.27, "r_x2": 420.61, "r_y2": 169.69, "r_x3": 414.39, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61, "r_y0": 176.27, "r_x1": 436.5, "r_y1": 176.27, "r_x2": 436.5, "r_y2": 170.08, "r_x3": 420.61, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.27, "r_x1": 442.72, "r_y1": 176.27, "r_x2": 442.72, "r_y2": 169.69, "r_x3": 436.5, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.73, "r_y0": 180.47, "r_x1": 464.13, "r_y1": 180.47, "r_x2": 464.13, "r_y2": 171.67, "r_x3": 442.73, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34, "r_y0": 192.43, "r_x1": 224.81, "r_y1": 192.43, "r_x2": 224.81, "r_y2": 183.63, "r_x3": 139.34, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.81, "r_y0": 188.23, "r_x1": 242.95, "r_y1": 188.23, "r_x2": 242.95, "r_y2": 182.04, "r_x3": 224.81, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.95, "r_y0": 188.23, "r_x1": 249.17, "r_y1": 188.23, "r_x2": 249.17, "r_y2": 181.65, "r_x3": 242.95, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17, "r_y0": 188.23, "r_x1": 265.06, "r_y1": 188.23, "r_x2": 265.06, "r_y2": 182.04, "r_x3": 249.17, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.06, "r_y0": 188.23, "r_x1": 271.29, "r_y1": 188.23, "r_x2": 271.29, "r_y2": 181.65, "r_x3": 265.06, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.29, "r_y0": 188.23, "r_x1": 287.17, "r_y1": 188.23, "r_x2": 287.17, "r_y2": 182.04, "r_x3": 271.29, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17, "r_y0": 188.23, "r_x1": 293.4, "r_y1": 188.23, "r_x2": 293.4, "r_y2": 181.65, "r_x3": 287.17, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.43, "r_x1": 404.16, "r_y1": 192.43, "r_x2": 404.16, "r_y2": 183.63, "r_x3": 293.4, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.16, "r_y0": 188.23, "r_x1": 410.38, "r_y1": 188.23, "r_x2": 410.38, "r_y2": 181.65, "r_x3": 404.16, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.39, "r_y0": 188.23, "r_x1": 426.27, "r_y1": 188.23, "r_x2": 426.27, "r_y2": 182.04, "r_x3": 410.39, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27, "r_y0": 188.23, "r_x1": 432.5, "r_y1": 188.23, "r_x2": 432.5, "r_y2": 181.65, "r_x3": 426.27, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.23, "r_x1": 448.38, "r_y1": 188.23, "r_x2": 448.38, "r_y2": 182.04, "r_x3": 432.5, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.38, "r_y0": 188.23, "r_x1": 454.61, "r_y1": 188.23, "r_x2": 454.61, "r_y2": 181.65, "r_x3": 448.38, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.61, "r_y0": 192.43, "r_x1": 476.01, "r_y1": 192.43, "r_x2": 476.01, "r_y2": 183.63, "r_x3": 454.61, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52, "r_y0": 204.38, "r_x1": 298.61, "r_y1": 204.38, "r_x2": 298.61, "r_y2": 195.58, "r_x3": 229.52, "r_y3": 195.58, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.61, "r_y0": 200.19, "r_x1": 316.75, "r_y1": 200.19, "r_x2": 316.75, "r_y2": 193.99, "r_x3": 298.61, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.75, "r_y0": 200.19, "r_x1": 322.97, "r_y1": 200.19, "r_x2": 322.97, "r_y2": 193.6, "r_x3": 316.75, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97, "r_y0": 200.19, "r_x1": 338.86, "r_y1": 200.19, "r_x2": 338.86, "r_y2": 193.99, "r_x3": 322.97, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.86, "r_y0": 200.19, "r_x1": 345.08, "r_y1": 200.19, "r_x2": 345.08, "r_y2": 193.6, "r_x3": 338.86, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.09, "r_y0": 200.19, "r_x1": 360.97, "r_y1": 200.19, "r_x2": 360.97, "r_y2": 193.99, "r_x3": 345.09, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97, "r_y0": 200.19, "r_x1": 367.2, "r_y1": 200.19, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 360.97, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.19, "r_x1": 385.34, "r_y1": 200.19, "r_x2": 385.34, "r_y2": 193.99, "r_x3": 367.2, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.11, "r_y0": 225.27, "r_x1": 336.25, "r_y1": 225.27, "r_x2": 336.25, "r_y2": 217.2, "r_x3": 279.11, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.97, "r_y0": 236.28, "r_x1": 392.39, "r_y1": 236.28, "r_x2": 392.39, "r_y2": 228.81, "r_x3": 222.97, "r_y3": 228.81, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 7, "label": "text", "bbox": { "l": 139.34, "t": 169.69, "r": 476.01, "b": 200.19, "coord_origin": "TOPLEFT" }, "confidence": 0.792, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.23, "r_y0": 180.47, "r_x1": 217.04, "r_y1": 180.47, "r_x2": 217.04, "r_y2": 171.67, "r_x3": 151.23, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "Maksym Lysak", "orig": "Maksym Lysak", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 217.05, "r_y0": 176.27, "r_x1": 235.19, "r_y1": 176.27, "r_x2": 235.19, "r_y2": 170.08, "r_x3": 217.05, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.19, "r_y0": 176.27, "r_x1": 241.41, "r_y1": 176.27, "r_x2": 241.41, "r_y2": 169.69, "r_x3": 235.19, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 241.41, "r_y0": 176.27, "r_x1": 257.3, "r_y1": 176.27, "r_x2": 257.3, "r_y2": 170.08, "r_x3": 241.41, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.3, "r_y0": 176.27, "r_x1": 263.52, "r_y1": 176.27, "r_x2": 263.52, "r_y2": 169.69, "r_x3": 257.3, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.52, "r_y0": 176.27, "r_x1": 279.41, "r_y1": 176.27, "r_x2": 279.41, "r_y2": 170.08, "r_x3": 263.52, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "3723", "orig": "3723", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.41, "r_y0": 176.27, "r_x1": 285.64, "r_y1": 176.27, "r_x2": 285.64, "r_y2": 169.69, "r_x3": 279.41, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.64, "r_y0": 180.47, "r_x1": 392.28, "r_y1": 180.47, "r_x2": 392.28, "r_y2": 171.67, "r_x3": 285.64, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{6960]}$, Ahmed Nassar[0000", "orig": "$^{6960]}$, Ahmed Nassar[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 392.28, "r_y0": 176.27, "r_x1": 398.5, "r_y1": 176.27, "r_x2": 398.5, "r_y2": 169.69, "r_x3": 392.28, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.5, "r_y0": 176.27, "r_x1": 414.39, "r_y1": 176.27, "r_x2": 414.39, "r_y2": 170.08, "r_x3": 398.5, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.39, "r_y0": 176.27, "r_x1": 420.61, "r_y1": 176.27, "r_x2": 420.61, "r_y2": 169.69, "r_x3": 414.39, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 420.61, "r_y0": 176.27, "r_x1": 436.5, "r_y1": 176.27, "r_x2": 436.5, "r_y2": 170.08, "r_x3": 420.61, "r_y3": 170.08, "coord_origin": "TOPLEFT" }, "text": "9468", "orig": "9468", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.5, "r_y0": 176.27, "r_x1": 442.72, "r_y1": 176.27, "r_x2": 442.72, "r_y2": 169.69, "r_x3": 436.5, "r_y3": 169.69, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.73, "r_y0": 180.47, "r_x1": 464.13, "r_y1": 180.47, "r_x2": 464.13, "r_y2": 171.67, "r_x3": 442.73, "r_y3": 171.67, "coord_origin": "TOPLEFT" }, "text": "$^{0822]}$,", "orig": "$^{0822]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.34, "r_y0": 192.43, "r_x1": 224.81, "r_y1": 192.43, "r_x2": 224.81, "r_y2": 183.63, "r_x3": 139.34, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "Nikolaos Livathinos", "orig": "Nikolaos Livathinos", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.81, "r_y0": 188.23, "r_x1": 242.95, "r_y1": 188.23, "r_x2": 242.95, "r_y2": 182.04, "r_x3": 224.81, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 242.95, "r_y0": 188.23, "r_x1": 249.17, "r_y1": 188.23, "r_x2": 249.17, "r_y2": 181.65, "r_x3": 242.95, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.17, "r_y0": 188.23, "r_x1": 265.06, "r_y1": 188.23, "r_x2": 265.06, "r_y2": 182.04, "r_x3": 249.17, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 265.06, "r_y0": 188.23, "r_x1": 271.29, "r_y1": 188.23, "r_x2": 271.29, "r_y2": 181.65, "r_x3": 265.06, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.29, "r_y0": 188.23, "r_x1": 287.17, "r_y1": 188.23, "r_x2": 287.17, "r_y2": 182.04, "r_x3": 271.29, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "8513", "orig": "8513", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 287.17, "r_y0": 188.23, "r_x1": 293.4, "r_y1": 188.23, "r_x2": 293.4, "r_y2": 181.65, "r_x3": 287.17, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.4, "r_y0": 192.43, "r_x1": 404.16, "r_y1": 192.43, "r_x2": 404.16, "r_y2": 183.63, "r_x3": 293.4, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{3491]}$, Christoph Auer[0000", "orig": "$^{3491]}$, Christoph Auer[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 404.16, "r_y0": 188.23, "r_x1": 410.38, "r_y1": 188.23, "r_x2": 410.38, "r_y2": 181.65, "r_x3": 404.16, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.39, "r_y0": 188.23, "r_x1": 426.27, "r_y1": 188.23, "r_x2": 426.27, "r_y2": 182.04, "r_x3": 410.39, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "0001", "orig": "0001", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.27, "r_y0": 188.23, "r_x1": 432.5, "r_y1": 188.23, "r_x2": 432.5, "r_y2": 181.65, "r_x3": 426.27, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 432.5, "r_y0": 188.23, "r_x1": 448.38, "r_y1": 188.23, "r_x2": 448.38, "r_y2": 182.04, "r_x3": 432.5, "r_y3": 182.04, "coord_origin": "TOPLEFT" }, "text": "5761", "orig": "5761", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 448.38, "r_y0": 188.23, "r_x1": 454.61, "r_y1": 188.23, "r_x2": 454.61, "r_y2": 181.65, "r_x3": 448.38, "r_y3": 181.65, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 454.61, "r_y0": 192.43, "r_x1": 476.01, "r_y1": 192.43, "r_x2": 476.01, "r_y2": 183.63, "r_x3": 454.61, "r_y3": 183.63, "coord_origin": "TOPLEFT" }, "text": "$^{0422]}$,", "orig": "$^{0422]}$,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 298.61, "r_y0": 200.19, "r_x1": 316.75, "r_y1": 200.19, "r_x2": 316.75, "r_y2": 193.99, "r_x3": 298.61, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "[0000", "orig": "[0000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 316.75, "r_y0": 200.19, "r_x1": 322.97, "r_y1": 200.19, "r_x2": 322.97, "r_y2": 193.6, "r_x3": 316.75, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 322.97, "r_y0": 200.19, "r_x1": 338.86, "r_y1": 200.19, "r_x2": 338.86, "r_y2": 193.99, "r_x3": 322.97, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0002", "orig": "0002", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 338.86, "r_y0": 200.19, "r_x1": 345.08, "r_y1": 200.19, "r_x2": 345.08, "r_y2": 193.6, "r_x3": 338.86, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.09, "r_y0": 200.19, "r_x1": 360.97, "r_y1": 200.19, "r_x2": 360.97, "r_y2": 193.99, "r_x3": 345.09, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "8088", "orig": "8088", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 360.97, "r_y0": 200.19, "r_x1": 367.2, "r_y1": 200.19, "r_x2": 367.2, "r_y2": 193.6, "r_x3": 360.97, "r_y3": 193.6, "coord_origin": "TOPLEFT" }, "text": "\u2212", "orig": "\u2212", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.2, "r_y0": 200.19, "r_x1": 385.34, "r_y1": 200.19, "r_x2": 385.34, "r_y2": 193.99, "r_x3": 367.2, "r_y3": 193.99, "coord_origin": "TOPLEFT" }, "text": "0823]", "orig": "0823]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 229.52, "t": 195.58, "r": 298.61, "b": 204.38, "coord_origin": "TOPLEFT" }, "confidence": 0.502, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.52, "r_y0": 204.38, "r_x1": 298.61, "r_y1": 204.38, "r_x2": 298.61, "r_y2": 195.58, "r_x3": 229.52, "r_y3": 195.58, "coord_origin": "TOPLEFT" }, "text": "and Peter Staar", "orig": "and Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "text", "bbox": { "l": 279.11, "t": 217.2, "r": 336.25, "b": 225.27, "coord_origin": "TOPLEFT" }, "confidence": 0.631, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 279.11, "r_y0": 225.27, "r_x1": 336.25, "r_y1": 225.27, "r_x2": 336.25, "r_y2": 217.2, "r_x3": 279.11, "r_y3": 217.2, "coord_origin": "TOPLEFT" }, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "text", "bbox": { "l": 222.97, "t": 228.81, "r": 392.39, "b": 236.28, "coord_origin": "TOPLEFT" }, "confidence": 0.692, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.97, "r_y0": 236.28, "r_x1": 392.39, "r_y1": 236.28, "r_x2": 392.39, "r_y2": 228.81, "r_x3": 222.97, "r_y3": 228.81, "coord_origin": "TOPLEFT" }, "text": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "orig": "{mly,ahn,nli,cau,taa}@zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null }, { "label": "text", "id": 1, "page_no": 0, "cluster": { "id": 1, "label": "text", "bbox": { "l": 163.11, "t": 270.3, "r": 452.25, "b": 464.73, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 278.23, "r_x1": 206.64, "r_y1": 278.23, "r_x2": 206.64, "r_y2": 270.3, "r_x3": 163.11, "r_y3": 270.3, "coord_origin": "TOPLEFT" }, "text": "Abstract.", "orig": "Abstract.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 211.62, "r_y0": 278.43, "r_x1": 452.24, "r_y1": 278.43, "r_x2": 452.24, "r_y2": 270.36, "r_x3": 211.62, "r_y3": 270.36, "coord_origin": "TOPLEFT" }, "text": "Extracting tables from documents is a crucial task in any", "orig": "Extracting tables from documents is a crucial task in any", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 289.39, "r_x1": 452.24, "r_y1": 289.39, "r_x2": 452.24, "r_y2": 281.32, "r_x3": 163.11, "r_y3": 281.32, "coord_origin": "TOPLEFT" }, "text": "document conversion pipeline. Recently, transformer-based models have", "orig": "document conversion pipeline. Recently, transformer-based models have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 300.35, "r_x1": 452.25, "r_y1": 300.35, "r_x2": 452.25, "r_y2": 292.28, "r_x3": 163.11, "r_y3": 292.28, "coord_origin": "TOPLEFT" }, "text": "demonstrated that table-structure can be recognized with impressive ac-", "orig": "demonstrated that table-structure can be recognized with impressive ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 311.31, "r_x1": 452.24, "r_y1": 311.31, "r_x2": 452.24, "r_y2": 303.24, "r_x3": 163.11, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "orig": "curacy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 322.27, "r_x1": 452.25, "r_y1": 322.27, "r_x2": 452.25, "r_y2": 314.2, "r_x3": 163.11, "r_y3": 314.2, "coord_origin": "TOPLEFT" }, "text": "only the image of a table, such models predict a sequence of tokens (e.g.", "orig": "only the image of a table, such models predict a sequence of tokens (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 333.23, "r_x1": 452.25, "r_y1": 333.23, "r_x2": 452.25, "r_y2": 325.16, "r_x3": 163.11, "r_y3": 325.16, "coord_origin": "TOPLEFT" }, "text": "in HTML, LaTeX) which represent the structure of the table. Since the", "orig": "in HTML, LaTeX) which represent the structure of the table. Since the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 344.19, "r_x1": 452.25, "r_y1": 344.19, "r_x2": 452.25, "r_y2": 336.12, "r_x3": 163.11, "r_y3": 336.12, "coord_origin": "TOPLEFT" }, "text": "token representation of the table structure has a significant impact on", "orig": "token representation of the table structure has a significant impact on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 355.15, "r_x1": 452.25, "r_y1": 355.15, "r_x2": 452.25, "r_y2": 347.08, "r_x3": 163.11, "r_y3": 347.08, "coord_origin": "TOPLEFT" }, "text": "the accuracy and run-time performance of any Im2Seq model, we inves-", "orig": "the accuracy and run-time performance of any Im2Seq model, we inves-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 366.1, "r_x1": 452.25, "r_y1": 366.1, "r_x2": 452.25, "r_y2": 358.03, "r_x3": 163.11, "r_y3": 358.03, "coord_origin": "TOPLEFT" }, "text": "tigate in this paper how table-structure representation can be optimised.", "orig": "tigate in this paper how table-structure representation can be optimised.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 377.06, "r_x1": 452.25, "r_y1": 377.06, "r_x2": 452.25, "r_y2": 368.99, "r_x3": 163.11, "r_y3": 368.99, "coord_origin": "TOPLEFT" }, "text": "We propose a new, optimised table-structure language (OTSL) with a", "orig": "We propose a new, optimised table-structure language (OTSL) with a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 388.02, "r_x1": 452.24, "r_y1": 388.02, "r_x2": 452.24, "r_y2": 379.95, "r_x3": 163.11, "r_y3": 379.95, "coord_origin": "TOPLEFT" }, "text": "minimized vocabulary and specific rules. The benefits of OTSL are that", "orig": "minimized vocabulary and specific rules. The benefits of OTSL are that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 398.98, "r_x1": 452.24, "r_y1": 398.98, "r_x2": 452.24, "r_y2": 390.91, "r_x3": 163.11, "r_y3": 390.91, "coord_origin": "TOPLEFT" }, "text": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "orig": "it reduces the number of tokens to 5 (HTML needs 28+) and shortens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 409.94, "r_x1": 452.25, "r_y1": 409.94, "r_x2": 452.25, "r_y2": 401.87, "r_x3": 163.11, "r_y3": 401.87, "coord_origin": "TOPLEFT" }, "text": "the sequence length to half of HTML on average. Consequently, model", "orig": "the sequence length to half of HTML on average. Consequently, model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 420.9, "r_x1": 452.24, "r_y1": 420.9, "r_x2": 452.24, "r_y2": 412.83, "r_x3": 163.11, "r_y3": 412.83, "coord_origin": "TOPLEFT" }, "text": "accuracy improves significantly, inference time is halved compared to", "orig": "accuracy improves significantly, inference time is halved compared to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 431.86, "r_x1": 452.24, "r_y1": 431.86, "r_x2": 452.24, "r_y2": 423.79, "r_x3": 163.11, "r_y3": 423.79, "coord_origin": "TOPLEFT" }, "text": "HTML-based models, and the predicted table structures are always syn-", "orig": "HTML-based models, and the predicted table structures are always syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 442.82, "r_x1": 452.24, "r_y1": 442.82, "r_x2": 452.24, "r_y2": 434.75, "r_x3": 163.11, "r_y3": 434.75, "coord_origin": "TOPLEFT" }, "text": "tactically correct. This in turn eliminates most post-processing needs.", "orig": "tactically correct. This in turn eliminates most post-processing needs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 453.78, "r_x1": 452.25, "r_y1": 453.78, "r_x2": 452.25, "r_y2": 445.71, "r_x3": 163.11, "r_y3": 445.71, "coord_origin": "TOPLEFT" }, "text": "Popular table structure data-sets will be published in OTSL format to", "orig": "Popular table structure data-sets will be published in OTSL format to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 464.73, "r_x1": 225.56, "r_y1": 464.73, "r_x2": 225.56, "r_y2": 456.66, "r_x3": 163.11, "r_y3": 456.66, "coord_origin": "TOPLEFT" }, "text": "the community.", "orig": "the community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Abstract. Extracting tables from documents is a crucial task in any document conversion pipeline. Recently, transformer-based models have demonstrated that table-structure can be recognized with impressive accuracy using Image-to-Markup-Sequence (Im2Seq) approaches. Taking only the image of a table, such models predict a sequence of tokens (e.g. in HTML, LaTeX) which represent the structure of the table. Since the token representation of the table structure has a significant impact on the accuracy and run-time performance of any Im2Seq model, we investigate in this paper how table-structure representation can be optimised. We propose a new, optimised table-structure language (OTSL) with a minimized vocabulary and specific rules. The benefits of OTSL are that it reduces the number of tokens to 5 (HTML needs 28+) and shortens the sequence length to half of HTML on average. Consequently, model accuracy improves significantly, inference time is halved compared to HTML-based models, and the predicted table structures are always syntactically correct. This in turn eliminates most post-processing needs. Popular table structure data-sets will be published in OTSL format to the community." }, { "label": "text", "id": 4, "page_no": 0, "cluster": { "id": 4, "label": "text", "bbox": { "l": 163.11, "t": 478.69, "r": 452.24, "b": 497.79, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 486.62, "r_x1": 211.94, "r_y1": 486.62, "r_x2": 211.94, "r_y2": 478.69, "r_x3": 163.11, "r_y3": 478.69, "coord_origin": "TOPLEFT" }, "text": "Keywords:", "orig": "Keywords:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.55, "r_y0": 486.83, "r_x1": 452.24, "r_y1": 486.83, "r_x2": 452.24, "r_y2": 478.76, "r_x3": 216.55, "r_y3": 478.76, "coord_origin": "TOPLEFT" }, "text": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "orig": "Table Structure Recognition \u00b7 Data Representation \u00b7 Trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 163.11, "r_y0": 497.79, "r_x1": 257.64, "r_y1": 497.79, "r_x2": 257.64, "r_y2": 489.72, "r_x3": 163.11, "r_y3": 489.72, "coord_origin": "TOPLEFT" }, "text": "formers \u00b7 Optimization.", "orig": "formers \u00b7 Optimization.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Keywords: Table Structure Recognition \u00b7 Data Representation \u00b7 Transformers \u00b7 Optimization." }, { "label": "section_header", "id": 3, "page_no": 0, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.77, "t": 522.12, "r": 228.93, "b": 532.69, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 532.69, "r_x1": 141.49, "r_y1": 532.69, "r_x2": 141.49, "r_y2": 522.12, "r_x3": 134.77, "r_y3": 522.12, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 532.69, "r_x1": 228.93, "r_y1": 532.69, "r_x2": 228.93, "r_y2": 522.12, "r_x3": 154.94, "r_y3": 522.12, "coord_origin": "TOPLEFT" }, "text": "Introduction", "orig": "Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1 Introduction" }, { "label": "text", "id": 0, "page_no": 0, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.77, "t": 548.29, "r": 480.6, "b": 628.81, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 557.08, "r_x1": 480.59, "r_y1": 557.08, "r_x2": 480.59, "r_y2": 548.29, "r_x3": 134.77, "r_y3": 548.29, "coord_origin": "TOPLEFT" }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "orig": "Tables are ubiquitous in documents such as scientific papers, patents, reports,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 569.04, "r_x1": 480.59, "r_y1": 569.04, "r_x2": 480.59, "r_y2": 560.24, "r_x3": 134.77, "r_y3": 560.24, "coord_origin": "TOPLEFT" }, "text": "manuals, specification sheets or marketing material. They often encode highly", "orig": "manuals, specification sheets or marketing material. They often encode highly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 580.99, "r_x1": 480.59, "r_y1": 580.99, "r_x2": 480.59, "r_y2": 572.2, "r_x3": 134.77, "r_y3": 572.2, "coord_origin": "TOPLEFT" }, "text": "valuable information and therefore need to be extracted with high accuracy.", "orig": "valuable information and therefore need to be extracted with high accuracy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 592.95, "r_x1": 480.6, "r_y1": 592.95, "r_x2": 480.6, "r_y2": 584.15, "r_x3": 134.77, "r_y3": 584.15, "coord_origin": "TOPLEFT" }, "text": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "orig": "Unfortunately, tables appear in documents in various sizes, styling and struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 604.9, "r_x1": 480.59, "r_y1": 604.9, "r_x2": 480.59, "r_y2": 596.11, "r_x3": 134.77, "r_y3": 596.11, "coord_origin": "TOPLEFT" }, "text": "ture, making it difficult to recover their correct structure with simple analyt-", "orig": "ture, making it difficult to recover their correct structure with simple analyt-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 616.86, "r_x1": 480.59, "r_y1": 616.86, "r_x2": 480.59, "r_y2": 608.06, "r_x3": 134.77, "r_y3": 608.06, "coord_origin": "TOPLEFT" }, "text": "ical methods. Therefore, accurate table extraction is achieved these days with", "orig": "ical methods. Therefore, accurate table extraction is achieved these days with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.81, "r_x1": 279.33, "r_y1": 628.81, "r_x2": 279.33, "r_y2": 620.02, "r_x3": 134.77, "r_y3": 620.02, "coord_origin": "TOPLEFT" }, "text": "machine-learning based methods.", "orig": "machine-learning based methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Tables are ubiquitous in documents such as scientific papers, patents, reports, manuals, specification sheets or marketing material. They often encode highly valuable information and therefore need to be extracted with high accuracy. Unfortunately, tables appear in documents in various sizes, styling and structure, making it difficult to recover their correct structure with simple analytical methods. Therefore, accurate table extraction is achieved these days with machine-learning based methods." }, { "label": "text", "id": 2, "page_no": 0, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.77, "t": 632.15, "r": 480.6, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 149.71, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "In modern document understanding systems [1,15], table extraction is typi-", "orig": "In modern document understanding systems [1,15], table extraction is typi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.6, "r_y1": 652.9, "r_x2": 480.6, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "cally a two-step process. Firstly, every table on a page is located with a bounding", "orig": "cally a two-step process. Firstly, every table on a page is located with a bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "box, and secondly, their logical row and column structure is recognized. As of", "orig": "box, and secondly, their logical row and column structure is recognized. As of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In modern document understanding systems [1,15], table extraction is typically a two-step process. Firstly, every table on a page is located with a bounding box, and secondly, their logical row and column structure is recognized. As of" } ], "headers": [ { "label": "page_header", "id": 6, "page_no": 0, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 18.34, "t": 209.48, "r": 36.34, "b": 555.0, "coord_origin": "TOPLEFT" }, "confidence": 0.89, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 18.34, "r_y0": 555.0, "r_x1": 36.34, "r_y1": 555.0, "r_x2": 36.34, "r_y2": 209.48, "r_x3": 18.34, "r_y3": 209.48, "coord_origin": "TOPLEFT" }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "orig": "arXiv:2305.03393v1 [cs.CV] 5 May 2023", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "arXiv:2305.03393v1 [cs.CV] 5 May 2023" } ] } }, { "page_no": 1, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 134.26, "r_x1": 162.64, "r_y1": 134.26, "r_x2": 162.64, "r_y2": 126.33, "r_x3": 134.76, "r_y3": 126.33, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.06, "r_y0": 134.47, "r_x1": 480.59, "r_y1": 134.47, "r_x2": 480.59, "r_y2": 126.4, "r_x3": 167.06, "r_y3": 126.4, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 145.43, "r_x1": 480.59, "r_y1": 145.43, "r_x2": 480.59, "r_y2": 137.36, "r_x3": 134.76, "r_y3": 137.36, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 156.38, "r_x1": 147.95, "r_y1": 156.38, "r_x2": 147.95, "r_y2": 148.31, "r_x3": 134.76, "r_y3": 148.31, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.39, "r_y0": 156.38, "r_x1": 480.59, "r_y1": 156.38, "r_x2": 480.59, "r_y2": 148.31, "r_x3": 152.39, "r_y3": 148.31, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 167.34, "r_x1": 480.59, "r_y1": 167.34, "r_x2": 480.59, "r_y2": 159.27, "r_x3": 134.76, "r_y3": 159.27, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 178.3, "r_x1": 480.59, "r_y1": 178.3, "r_x2": 480.59, "r_y2": 170.23, "r_x3": 134.76, "r_y3": 170.23, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 189.26, "r_x1": 480.59, "r_y1": 189.26, "r_x2": 480.59, "r_y2": 181.19, "r_x3": 134.76, "r_y3": 181.19, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 200.22, "r_x1": 460.87, "r_y1": 200.22, "r_x2": 460.87, "r_y2": 192.15, "r_x3": 134.76, "r_y3": 192.15, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41, "r_y0": 289.51, "r_x1": 402.97, "r_y1": 289.51, "r_x2": 402.97, "r_y2": 280.98, "r_x3": 396.41, "r_y3": 280.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.59, "r_y0": 289.42, "r_x1": 425.15, "r_y1": 289.42, "r_x2": 425.15, "r_y2": 280.9, "r_x3": 418.59, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.75, "r_y0": 311.76, "r_x1": 402.31, "r_y1": 311.76, "r_x2": 402.31, "r_y2": 303.24, "r_x3": 395.75, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.37, "r_x3": 407.54, "r_y3": 303.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56, "r_y0": 322.93, "r_x1": 414.13, "r_y1": 322.93, "r_x2": 414.13, "r_y2": 314.41, "r_x3": 407.56, "r_y3": 314.41, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51, "r_y0": 300.61, "r_x1": 425.07, "r_y1": 300.61, "r_x2": 425.07, "r_y2": 292.09, "r_x3": 418.51, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.62, "r_x1": 436.16, "r_y1": 300.62, "r_x2": 436.16, "r_y2": 292.09, "r_x3": 429.6, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.69, "r_y0": 300.54, "r_x1": 447.25, "r_y1": 300.54, "r_x2": 447.25, "r_y2": 292.01, "r_x3": 440.69, "r_y3": 292.01, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62, "r_y0": 311.82, "r_x1": 425.19, "r_y1": 311.82, "r_x2": 425.19, "r_y2": 303.29, "r_x3": 418.62, "r_y3": 303.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 311.83, "r_x1": 436.27, "r_y1": 311.83, "r_x2": 436.27, "r_y2": 303.3, "r_x3": 429.71, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.75, "r_x1": 447.36, "r_y1": 311.75, "r_x2": 447.36, "r_y2": 303.22, "r_x3": 440.8, "r_y3": 303.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.63, "r_y0": 323.09, "r_x1": 425.19, "r_y1": 323.09, "r_x2": 425.19, "r_y2": 314.57, "r_x3": 418.63, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 323.1, "r_x1": 436.27, "r_y1": 323.1, "r_x2": 436.27, "r_y2": 314.57, "r_x3": 429.71, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.02, "r_x1": 447.36, "r_y1": 323.02, "r_x2": 447.36, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.82, "r_x1": 413.96, "r_y1": 333.82, "r_x2": 413.96, "r_y2": 325.29, "r_x3": 407.4, "r_y3": 325.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.46, "r_y0": 333.98, "r_x1": 425.02, "r_y1": 333.98, "r_x2": 425.02, "r_y2": 325.45, "r_x3": 418.46, "r_y3": 325.45, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.55, "r_y0": 333.98, "r_x1": 436.11, "r_y1": 333.98, "r_x2": 436.11, "r_y2": 325.46, "r_x3": 429.55, "r_y3": 325.46, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.64, "r_y0": 333.91, "r_x1": 447.2, "r_y1": 333.91, "r_x2": 447.2, "r_y2": 325.38, "r_x3": 440.64, "r_y3": 325.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.68, "r_x1": 463.51, "r_y1": 288.68, "r_x2": 463.51, "r_y2": 280.16, "r_x3": 451.9, "r_y3": 280.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.16, "r_y0": 300.12, "r_x1": 463.77, "r_y1": 300.12, "r_x2": 463.77, "r_y2": 291.6, "r_x3": 452.16, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.18, "r_y0": 311.37, "r_x1": 463.79, "r_y1": 311.37, "r_x2": 463.79, "r_y2": 302.84, "r_x3": 452.18, "r_y3": 302.84, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.65, "r_x1": 463.72, "r_y1": 322.65, "r_x2": 463.72, "r_y2": 314.12, "r_x3": 452.1, "r_y3": 314.12, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 333.99, "r_x1": 463.91, "r_y1": 333.99, "r_x2": 463.91, "r_y2": 325.47, "r_x3": 452.3, "r_y3": 325.47, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.02, "r_x1": 402.66, "r_y1": 323.02, "r_x2": 402.66, "r_y2": 314.49, "r_x3": 396.1, "r_y3": 314.49, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.91, "r_x1": 402.56, "r_y1": 333.91, "r_x2": 402.56, "r_y2": 325.39, "r_x3": 396.0, "r_y3": 325.39, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 300.8, "r_x1": 402.84, "r_y1": 300.8, "r_x2": 402.84, "r_y2": 292.27, "r_x3": 396.27, "r_y3": 292.27, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.55, "r_y0": 289.49, "r_x1": 413.6, "r_y1": 289.49, "r_x2": 413.6, "r_y2": 280.97, "r_x3": 408.55, "r_y3": 280.97, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.59, "r_y0": 289.02, "r_x1": 435.64, "r_y1": 289.02, "r_x2": 435.64, "r_y2": 280.5, "r_x3": 430.59, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08, "r_y0": 288.91, "r_x1": 446.13, "r_y1": 288.91, "r_x2": 446.13, "r_y2": 280.38, "r_x3": 441.08, "r_y3": 280.38, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97, "r_y0": 300.66, "r_x1": 414.04, "r_y1": 300.66, "r_x2": 414.04, "r_y2": 292.13, "r_x3": 407.97, "r_y3": 292.13, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.26, "r_y0": 419.71, "r_x1": 452.87, "r_y1": 419.71, "r_x2": 452.87, "r_y2": 411.18, "r_x3": 441.26, "r_y3": 411.18, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 406.9, "r_x1": 432.49, "r_y1": 406.9, "r_x2": 432.49, "r_y2": 399.79, "r_x3": 393.75, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.59, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.79, "r_x3": 434.59, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.91, "r_y0": 406.9, "r_x1": 463.22, "r_y1": 406.9, "r_x2": 463.22, "r_y2": 399.79, "r_x3": 440.91, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.12, "r_y0": 265.65, "r_x1": 413.99, "r_y1": 265.65, "r_x2": 413.99, "r_y2": 258.55, "r_x3": 384.12, "r_y3": 258.55, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 273.78, "r_x1": 451.45, "r_y1": 273.78, "r_x2": 451.45, "r_y2": 266.68, "r_x3": 393.75, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55, "r_y0": 273.78, "r_x1": 461.97, "r_y1": 273.78, "r_x2": 461.97, "r_y2": 266.68, "r_x3": 453.55, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79, "r_y0": 406.86, "r_x1": 233.89, "r_y1": 406.86, "r_x2": 233.89, "r_y2": 399.76, "r_x3": 151.79, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99, "r_y0": 406.86, "r_x1": 244.42, "r_y1": 406.86, "r_x2": 244.42, "r_y2": 399.76, "r_x3": 235.99, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52, "r_y0": 406.86, "r_x1": 268.84, "r_y1": 406.86, "r_x2": 268.84, "r_y2": 399.76, "r_x3": 246.52, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.33, "r_y0": 220.68, "r_x1": 159.8, "r_y1": 220.68, "r_x2": 159.8, "r_y2": 213.57, "r_x3": 154.33, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07, "r_y0": 220.68, "r_x1": 326.54, "r_y1": 220.68, "r_x2": 326.54, "r_y2": 213.57, "r_x3": 321.07, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 286.7, "r_x1": 175.84, "r_y1": 286.7, "r_x2": 175.84, "r_y2": 280.3, "r_x3": 153.09, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 293.52, "r_x1": 172.8, "r_y1": 293.52, "r_x2": 172.8, "r_y2": 287.12, "r_x3": 160.67, "r_y3": 287.12, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 300.33, "r_x1": 177.91, "r_y1": 300.33, "r_x2": 177.91, "r_y2": 293.94, "r_x3": 168.25, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.36, "r_y0": 300.33, "r_x1": 278.9, "r_y1": 300.33, "r_x2": 278.9, "r_y2": 293.94, "r_x3": 263.36, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79, "r_y0": 300.33, "r_x1": 290.46, "r_y1": 300.33, "r_x2": 290.46, "r_y2": 293.94, "r_x3": 280.79, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.93, "r_y0": 300.33, "r_x1": 351.47, "r_y1": 300.33, "r_x2": 351.47, "r_y2": 293.94, "r_x3": 335.93, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 307.15, "r_x1": 174.69, "r_y1": 307.15, "r_x2": 174.69, "r_y2": 300.75, "r_x3": 160.67, "r_y3": 300.75, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 313.97, "r_x1": 172.8, "r_y1": 313.97, "r_x2": 172.8, "r_y2": 307.57, "r_x3": 160.67, "r_y3": 307.57, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 320.78, "r_x1": 181.89, "r_y1": 320.78, "r_x2": 181.89, "r_y2": 314.39, "r_x3": 168.25, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 320.78, "r_x1": 214.87, "r_y1": 320.78, "r_x2": 214.87, "r_y2": 314.39, "r_x3": 201.22, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 320.78, "r_x1": 247.84, "r_y1": 320.78, "r_x2": 247.84, "r_y2": 314.39, "r_x3": 234.19, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 327.6, "r_x1": 174.69, "r_y1": 327.6, "r_x2": 174.69, "r_y2": 321.2, "r_x3": 160.67, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 334.42, "r_x1": 172.8, "r_y1": 334.42, "r_x2": 172.8, "r_y2": 328.02, "r_x3": 160.67, "r_y3": 328.02, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 341.23, "r_x1": 373.09, "r_y1": 341.23, "r_x2": 373.09, "r_y2": 334.84, "r_x3": 168.25, "r_y3": 334.84, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 348.05, "r_x1": 174.69, "r_y1": 348.05, "r_x2": 174.69, "r_y2": 341.66, "r_x3": 160.67, "r_y3": 341.66, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 354.87, "r_x1": 172.8, "r_y1": 354.87, "r_x2": 172.8, "r_y2": 348.47, "r_x3": 160.67, "r_y3": 348.47, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 361.68, "r_x1": 181.89, "r_y1": 361.68, "r_x2": 181.89, "r_y2": 355.29, "r_x3": 168.25, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 361.68, "r_x1": 214.87, "r_y1": 361.68, "r_x2": 214.87, "r_y2": 355.29, "r_x3": 201.22, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 361.68, "r_x1": 247.84, "r_y1": 361.68, "r_x2": 247.84, "r_y2": 355.29, "r_x3": 234.19, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 361.68, "r_x1": 280.81, "r_y1": 361.68, "r_x2": 280.81, "r_y2": 355.29, "r_x3": 267.17, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 368.5, "r_x1": 174.69, "r_y1": 368.5, "r_x2": 174.69, "r_y2": 362.11, "r_x3": 160.67, "r_y3": 362.11, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 375.32, "r_x1": 172.8, "r_y1": 375.32, "r_x2": 172.8, "r_y2": 368.92, "r_x3": 160.67, "r_y3": 368.92, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 382.13, "r_x1": 181.89, "r_y1": 382.13, "r_x2": 181.89, "r_y2": 375.74, "r_x3": 168.25, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 382.13, "r_x1": 214.87, "r_y1": 382.13, "r_x2": 214.87, "r_y2": 375.74, "r_x3": 201.22, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 382.13, "r_x1": 247.84, "r_y1": 382.13, "r_x2": 247.84, "r_y2": 375.74, "r_x3": 234.19, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 382.13, "r_x1": 280.81, "r_y1": 382.13, "r_x2": 280.81, "r_y2": 375.74, "r_x3": 267.17, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 388.95, "r_x1": 174.69, "r_y1": 388.95, "r_x2": 174.69, "r_y2": 382.56, "r_x3": 160.67, "r_y3": 382.56, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 395.77, "r_x1": 177.73, "r_y1": 395.77, "r_x2": 177.73, "r_y2": 389.37, "r_x3": 153.09, "r_y3": 389.37, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 320.78, "r_x1": 199.33, "r_y1": 320.78, "r_x2": 199.33, "r_y2": 314.39, "r_x3": 183.79, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 320.78, "r_x1": 232.3, "r_y1": 320.78, "r_x2": 232.3, "r_y2": 314.39, "r_x3": 216.76, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 320.78, "r_x1": 265.27, "r_y1": 320.78, "r_x2": 265.27, "r_y2": 314.39, "r_x3": 249.73, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 361.68, "r_x1": 199.33, "r_y1": 361.68, "r_x2": 199.33, "r_y2": 355.29, "r_x3": 183.79, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 361.68, "r_x1": 232.3, "r_y1": 361.68, "r_x2": 232.3, "r_y2": 355.29, "r_x3": 216.76, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 361.68, "r_x1": 265.27, "r_y1": 361.68, "r_x2": 265.27, "r_y2": 355.29, "r_x3": 249.73, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 361.68, "r_x1": 298.25, "r_y1": 361.68, "r_x2": 298.25, "r_y2": 355.29, "r_x3": 282.71, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 382.13, "r_x1": 199.33, "r_y1": 382.13, "r_x2": 199.33, "r_y2": 375.74, "r_x3": 183.79, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 382.13, "r_x1": 232.3, "r_y1": 382.13, "r_x2": 232.3, "r_y2": 375.74, "r_x3": 216.76, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 382.13, "r_x1": 265.27, "r_y1": 382.13, "r_x2": 265.27, "r_y2": 375.74, "r_x3": 249.73, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 382.13, "r_x1": 298.25, "r_y1": 382.13, "r_x2": 298.25, "r_y2": 375.74, "r_x3": 282.71, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06, "r_y0": 419.86, "r_x1": 401.62, "r_y1": 419.86, "r_x2": 401.62, "r_y2": 411.33, "r_x3": 395.06, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 419.86, "r_x1": 412.48, "r_y1": 419.86, "r_x2": 412.48, "r_y2": 411.33, "r_x3": 407.42, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69, "r_y0": 419.86, "r_x1": 425.26, "r_y1": 419.86, "r_x2": 425.26, "r_y2": 411.33, "r_x3": 418.69, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.51, "r_y0": 419.86, "r_x1": 436.57, "r_y1": 419.86, "r_x2": 436.57, "r_y2": 411.33, "r_x3": 430.51, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36, "r_y0": 416.17, "r_x1": 175.11, "r_y1": 416.17, "r_x2": 175.11, "r_y2": 409.77, "r_x3": 152.36, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89, "r_y0": 416.17, "r_x1": 191.02, "r_y1": 416.17, "r_x2": 191.02, "r_y2": 409.77, "r_x3": 178.89, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.81, "r_y0": 416.17, "r_x1": 208.83, "r_y1": 416.17, "r_x2": 208.83, "r_y2": 409.77, "r_x3": 194.81, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61, "r_y0": 416.17, "r_x1": 226.26, "r_y1": 416.17, "r_x2": 226.26, "r_y2": 409.77, "r_x3": 212.61, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.38, "r_y0": 416.17, "r_x1": 259.04, "r_y1": 416.17, "r_x2": 259.04, "r_y2": 409.77, "r_x3": 249.38, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.11, "r_x3": 244.46, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.05, "r_y0": 416.17, "r_x1": 245.59, "r_y1": 416.17, "r_x2": 245.59, "r_y2": 409.77, "r_x3": 230.05, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 265.71, "r_x1": 159.62, "r_y1": 265.71, "r_x2": 159.62, "r_y2": 258.6, "r_x3": 154.51, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74, "r_y0": 265.71, "r_x1": 185.22, "r_y1": 265.71, "r_x2": 185.22, "r_y2": 258.6, "r_x3": 164.74, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.35, "r_y0": 273.6, "r_x1": 222.05, "r_y1": 273.6, "r_x2": 222.05, "r_y2": 266.5, "r_x3": 164.35, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15, "r_y0": 273.6, "r_x1": 232.58, "r_y1": 273.6, "r_x2": 232.58, "r_y2": 266.5, "r_x3": 224.15, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 461.11, "r_x1": 161.33, "r_y1": 461.11, "r_x2": 161.33, "r_y2": 452.31, "r_x3": 134.76, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.27, "r_y0": 461.11, "r_x1": 226.29, "r_y1": 461.11, "r_x2": 226.29, "r_y2": 452.31, "r_x3": 164.27, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.99, "r_y0": 461.11, "r_x1": 480.59, "r_y1": 461.11, "r_x2": 480.59, "r_y2": 452.31, "r_x3": 229.99, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 473.07, "r_x1": 480.59, "r_y1": 473.07, "r_x2": 480.59, "r_y2": 464.27, "r_x3": 134.77, "r_y3": 464.27, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 485.02, "r_x1": 480.59, "r_y1": 485.02, "r_x2": 480.59, "r_y2": 476.22, "r_x3": 134.77, "r_y3": 476.22, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 496.98, "r_x1": 480.59, "r_y1": 496.98, "r_x2": 480.59, "r_y2": 488.18, "r_x3": 134.77, "r_y3": 488.18, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 508.93, "r_x1": 480.59, "r_y1": 508.93, "r_x2": 480.59, "r_y2": 500.13, "r_x3": 134.77, "r_y3": 500.13, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 520.89, "r_x1": 313.25, "r_y1": 520.89, "r_x2": 313.25, "r_y2": 512.09, "r_x3": 134.77, "r_y3": 512.09, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 149.71, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.77, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.77, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.77, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.77, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.33, "r_x3": 134.77, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.77, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.77, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.77, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.77, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 421.45, "r_y1": 664.85, "r_x2": 421.45, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.858, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.908, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "caption", "bbox": { "l": 134.76, "t": 126.33, "r": 480.59, "b": 200.22, "coord_origin": "TOPLEFT" }, "confidence": 0.894, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 134.26, "r_x1": 162.64, "r_y1": 134.26, "r_x2": 162.64, "r_y2": 126.33, "r_x3": 134.76, "r_y3": 126.33, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.06, "r_y0": 134.47, "r_x1": 480.59, "r_y1": 134.47, "r_x2": 480.59, "r_y2": 126.4, "r_x3": 167.06, "r_y3": 126.4, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 145.43, "r_x1": 480.59, "r_y1": 145.43, "r_x2": 480.59, "r_y2": 137.36, "r_x3": 134.76, "r_y3": 137.36, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 156.38, "r_x1": 147.95, "r_y1": 156.38, "r_x2": 147.95, "r_y2": 148.31, "r_x3": 134.76, "r_y3": 148.31, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.39, "r_y0": 156.38, "r_x1": 480.59, "r_y1": 156.38, "r_x2": 480.59, "r_y2": 148.31, "r_x3": 152.39, "r_y3": 148.31, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 167.34, "r_x1": 480.59, "r_y1": 167.34, "r_x2": 480.59, "r_y2": 159.27, "r_x3": 134.76, "r_y3": 159.27, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 178.3, "r_x1": 480.59, "r_y1": 178.3, "r_x2": 480.59, "r_y2": 170.23, "r_x3": 134.76, "r_y3": 170.23, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 189.26, "r_x1": 480.59, "r_y1": 189.26, "r_x2": 480.59, "r_y2": 181.19, "r_x3": 134.76, "r_y3": 181.19, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 200.22, "r_x1": 460.87, "r_y1": 200.22, "r_x2": 460.87, "r_y2": 192.15, "r_x3": 134.76, "r_y3": 192.15, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "picture", "bbox": { "l": 148.45, "t": 208.37, "r": 464.36, "b": 425.85, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41, "r_y0": 289.51, "r_x1": 402.97, "r_y1": 289.51, "r_x2": 402.97, "r_y2": 280.98, "r_x3": 396.41, "r_y3": 280.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.59, "r_y0": 289.42, "r_x1": 425.15, "r_y1": 289.42, "r_x2": 425.15, "r_y2": 280.9, "r_x3": 418.59, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.75, "r_y0": 311.76, "r_x1": 402.31, "r_y1": 311.76, "r_x2": 402.31, "r_y2": 303.24, "r_x3": 395.75, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.37, "r_x3": 407.54, "r_y3": 303.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56, "r_y0": 322.93, "r_x1": 414.13, "r_y1": 322.93, "r_x2": 414.13, "r_y2": 314.41, "r_x3": 407.56, "r_y3": 314.41, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51, "r_y0": 300.61, "r_x1": 425.07, "r_y1": 300.61, "r_x2": 425.07, "r_y2": 292.09, "r_x3": 418.51, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.62, "r_x1": 436.16, "r_y1": 300.62, "r_x2": 436.16, "r_y2": 292.09, "r_x3": 429.6, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.69, "r_y0": 300.54, "r_x1": 447.25, "r_y1": 300.54, "r_x2": 447.25, "r_y2": 292.01, "r_x3": 440.69, "r_y3": 292.01, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62, "r_y0": 311.82, "r_x1": 425.19, "r_y1": 311.82, "r_x2": 425.19, "r_y2": 303.29, "r_x3": 418.62, "r_y3": 303.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 311.83, "r_x1": 436.27, "r_y1": 311.83, "r_x2": 436.27, "r_y2": 303.3, "r_x3": 429.71, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.75, "r_x1": 447.36, "r_y1": 311.75, "r_x2": 447.36, "r_y2": 303.22, "r_x3": 440.8, "r_y3": 303.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.63, "r_y0": 323.09, "r_x1": 425.19, "r_y1": 323.09, "r_x2": 425.19, "r_y2": 314.57, "r_x3": 418.63, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 323.1, "r_x1": 436.27, "r_y1": 323.1, "r_x2": 436.27, "r_y2": 314.57, "r_x3": 429.71, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.02, "r_x1": 447.36, "r_y1": 323.02, "r_x2": 447.36, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.82, "r_x1": 413.96, "r_y1": 333.82, "r_x2": 413.96, "r_y2": 325.29, "r_x3": 407.4, "r_y3": 325.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.46, "r_y0": 333.98, "r_x1": 425.02, "r_y1": 333.98, "r_x2": 425.02, "r_y2": 325.45, "r_x3": 418.46, "r_y3": 325.45, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.55, "r_y0": 333.98, "r_x1": 436.11, "r_y1": 333.98, "r_x2": 436.11, "r_y2": 325.46, "r_x3": 429.55, "r_y3": 325.46, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.64, "r_y0": 333.91, "r_x1": 447.2, "r_y1": 333.91, "r_x2": 447.2, "r_y2": 325.38, "r_x3": 440.64, "r_y3": 325.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.68, "r_x1": 463.51, "r_y1": 288.68, "r_x2": 463.51, "r_y2": 280.16, "r_x3": 451.9, "r_y3": 280.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.16, "r_y0": 300.12, "r_x1": 463.77, "r_y1": 300.12, "r_x2": 463.77, "r_y2": 291.6, "r_x3": 452.16, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.18, "r_y0": 311.37, "r_x1": 463.79, "r_y1": 311.37, "r_x2": 463.79, "r_y2": 302.84, "r_x3": 452.18, "r_y3": 302.84, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.65, "r_x1": 463.72, "r_y1": 322.65, "r_x2": 463.72, "r_y2": 314.12, "r_x3": 452.1, "r_y3": 314.12, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 333.99, "r_x1": 463.91, "r_y1": 333.99, "r_x2": 463.91, "r_y2": 325.47, "r_x3": 452.3, "r_y3": 325.47, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.02, "r_x1": 402.66, "r_y1": 323.02, "r_x2": 402.66, "r_y2": 314.49, "r_x3": 396.1, "r_y3": 314.49, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.91, "r_x1": 402.56, "r_y1": 333.91, "r_x2": 402.56, "r_y2": 325.39, "r_x3": 396.0, "r_y3": 325.39, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 300.8, "r_x1": 402.84, "r_y1": 300.8, "r_x2": 402.84, "r_y2": 292.27, "r_x3": 396.27, "r_y3": 292.27, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.55, "r_y0": 289.49, "r_x1": 413.6, "r_y1": 289.49, "r_x2": 413.6, "r_y2": 280.97, "r_x3": 408.55, "r_y3": 280.97, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.59, "r_y0": 289.02, "r_x1": 435.64, "r_y1": 289.02, "r_x2": 435.64, "r_y2": 280.5, "r_x3": 430.59, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08, "r_y0": 288.91, "r_x1": 446.13, "r_y1": 288.91, "r_x2": 446.13, "r_y2": 280.38, "r_x3": 441.08, "r_y3": 280.38, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97, "r_y0": 300.66, "r_x1": 414.04, "r_y1": 300.66, "r_x2": 414.04, "r_y2": 292.13, "r_x3": 407.97, "r_y3": 292.13, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.26, "r_y0": 419.71, "r_x1": 452.87, "r_y1": 419.71, "r_x2": 452.87, "r_y2": 411.18, "r_x3": 441.26, "r_y3": 411.18, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 406.9, "r_x1": 432.49, "r_y1": 406.9, "r_x2": 432.49, "r_y2": 399.79, "r_x3": 393.75, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.59, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.79, "r_x3": 434.59, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.91, "r_y0": 406.9, "r_x1": 463.22, "r_y1": 406.9, "r_x2": 463.22, "r_y2": 399.79, "r_x3": 440.91, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.12, "r_y0": 265.65, "r_x1": 413.99, "r_y1": 265.65, "r_x2": 413.99, "r_y2": 258.55, "r_x3": 384.12, "r_y3": 258.55, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 273.78, "r_x1": 451.45, "r_y1": 273.78, "r_x2": 451.45, "r_y2": 266.68, "r_x3": 393.75, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55, "r_y0": 273.78, "r_x1": 461.97, "r_y1": 273.78, "r_x2": 461.97, "r_y2": 266.68, "r_x3": 453.55, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79, "r_y0": 406.86, "r_x1": 233.89, "r_y1": 406.86, "r_x2": 233.89, "r_y2": 399.76, "r_x3": 151.79, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99, "r_y0": 406.86, "r_x1": 244.42, "r_y1": 406.86, "r_x2": 244.42, "r_y2": 399.76, "r_x3": 235.99, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52, "r_y0": 406.86, "r_x1": 268.84, "r_y1": 406.86, "r_x2": 268.84, "r_y2": 399.76, "r_x3": 246.52, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.33, "r_y0": 220.68, "r_x1": 159.8, "r_y1": 220.68, "r_x2": 159.8, "r_y2": 213.57, "r_x3": 154.33, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07, "r_y0": 220.68, "r_x1": 326.54, "r_y1": 220.68, "r_x2": 326.54, "r_y2": 213.57, "r_x3": 321.07, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 286.7, "r_x1": 175.84, "r_y1": 286.7, "r_x2": 175.84, "r_y2": 280.3, "r_x3": 153.09, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 293.52, "r_x1": 172.8, "r_y1": 293.52, "r_x2": 172.8, "r_y2": 287.12, "r_x3": 160.67, "r_y3": 287.12, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 300.33, "r_x1": 177.91, "r_y1": 300.33, "r_x2": 177.91, "r_y2": 293.94, "r_x3": 168.25, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.36, "r_y0": 300.33, "r_x1": 278.9, "r_y1": 300.33, "r_x2": 278.9, "r_y2": 293.94, "r_x3": 263.36, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79, "r_y0": 300.33, "r_x1": 290.46, "r_y1": 300.33, "r_x2": 290.46, "r_y2": 293.94, "r_x3": 280.79, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.93, "r_y0": 300.33, "r_x1": 351.47, "r_y1": 300.33, "r_x2": 351.47, "r_y2": 293.94, "r_x3": 335.93, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 307.15, "r_x1": 174.69, "r_y1": 307.15, "r_x2": 174.69, "r_y2": 300.75, "r_x3": 160.67, "r_y3": 300.75, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 313.97, "r_x1": 172.8, "r_y1": 313.97, "r_x2": 172.8, "r_y2": 307.57, "r_x3": 160.67, "r_y3": 307.57, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 320.78, "r_x1": 181.89, "r_y1": 320.78, "r_x2": 181.89, "r_y2": 314.39, "r_x3": 168.25, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 320.78, "r_x1": 214.87, "r_y1": 320.78, "r_x2": 214.87, "r_y2": 314.39, "r_x3": 201.22, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 320.78, "r_x1": 247.84, "r_y1": 320.78, "r_x2": 247.84, "r_y2": 314.39, "r_x3": 234.19, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 327.6, "r_x1": 174.69, "r_y1": 327.6, "r_x2": 174.69, "r_y2": 321.2, "r_x3": 160.67, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 334.42, "r_x1": 172.8, "r_y1": 334.42, "r_x2": 172.8, "r_y2": 328.02, "r_x3": 160.67, "r_y3": 328.02, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 341.23, "r_x1": 373.09, "r_y1": 341.23, "r_x2": 373.09, "r_y2": 334.84, "r_x3": 168.25, "r_y3": 334.84, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 348.05, "r_x1": 174.69, "r_y1": 348.05, "r_x2": 174.69, "r_y2": 341.66, "r_x3": 160.67, "r_y3": 341.66, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 354.87, "r_x1": 172.8, "r_y1": 354.87, "r_x2": 172.8, "r_y2": 348.47, "r_x3": 160.67, "r_y3": 348.47, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 361.68, "r_x1": 181.89, "r_y1": 361.68, "r_x2": 181.89, "r_y2": 355.29, "r_x3": 168.25, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 361.68, "r_x1": 214.87, "r_y1": 361.68, "r_x2": 214.87, "r_y2": 355.29, "r_x3": 201.22, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 361.68, "r_x1": 247.84, "r_y1": 361.68, "r_x2": 247.84, "r_y2": 355.29, "r_x3": 234.19, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 361.68, "r_x1": 280.81, "r_y1": 361.68, "r_x2": 280.81, "r_y2": 355.29, "r_x3": 267.17, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 368.5, "r_x1": 174.69, "r_y1": 368.5, "r_x2": 174.69, "r_y2": 362.11, "r_x3": 160.67, "r_y3": 362.11, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 375.32, "r_x1": 172.8, "r_y1": 375.32, "r_x2": 172.8, "r_y2": 368.92, "r_x3": 160.67, "r_y3": 368.92, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 382.13, "r_x1": 181.89, "r_y1": 382.13, "r_x2": 181.89, "r_y2": 375.74, "r_x3": 168.25, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 382.13, "r_x1": 214.87, "r_y1": 382.13, "r_x2": 214.87, "r_y2": 375.74, "r_x3": 201.22, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 382.13, "r_x1": 247.84, "r_y1": 382.13, "r_x2": 247.84, "r_y2": 375.74, "r_x3": 234.19, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 382.13, "r_x1": 280.81, "r_y1": 382.13, "r_x2": 280.81, "r_y2": 375.74, "r_x3": 267.17, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 388.95, "r_x1": 174.69, "r_y1": 388.95, "r_x2": 174.69, "r_y2": 382.56, "r_x3": 160.67, "r_y3": 382.56, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 395.77, "r_x1": 177.73, "r_y1": 395.77, "r_x2": 177.73, "r_y2": 389.37, "r_x3": 153.09, "r_y3": 389.37, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 320.78, "r_x1": 199.33, "r_y1": 320.78, "r_x2": 199.33, "r_y2": 314.39, "r_x3": 183.79, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 320.78, "r_x1": 232.3, "r_y1": 320.78, "r_x2": 232.3, "r_y2": 314.39, "r_x3": 216.76, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 320.78, "r_x1": 265.27, "r_y1": 320.78, "r_x2": 265.27, "r_y2": 314.39, "r_x3": 249.73, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 361.68, "r_x1": 199.33, "r_y1": 361.68, "r_x2": 199.33, "r_y2": 355.29, "r_x3": 183.79, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 361.68, "r_x1": 232.3, "r_y1": 361.68, "r_x2": 232.3, "r_y2": 355.29, "r_x3": 216.76, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 361.68, "r_x1": 265.27, "r_y1": 361.68, "r_x2": 265.27, "r_y2": 355.29, "r_x3": 249.73, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 361.68, "r_x1": 298.25, "r_y1": 361.68, "r_x2": 298.25, "r_y2": 355.29, "r_x3": 282.71, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 382.13, "r_x1": 199.33, "r_y1": 382.13, "r_x2": 199.33, "r_y2": 375.74, "r_x3": 183.79, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 382.13, "r_x1": 232.3, "r_y1": 382.13, "r_x2": 232.3, "r_y2": 375.74, "r_x3": 216.76, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 382.13, "r_x1": 265.27, "r_y1": 382.13, "r_x2": 265.27, "r_y2": 375.74, "r_x3": 249.73, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 382.13, "r_x1": 298.25, "r_y1": 382.13, "r_x2": 298.25, "r_y2": 375.74, "r_x3": 282.71, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06, "r_y0": 419.86, "r_x1": 401.62, "r_y1": 419.86, "r_x2": 401.62, "r_y2": 411.33, "r_x3": 395.06, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 419.86, "r_x1": 412.48, "r_y1": 419.86, "r_x2": 412.48, "r_y2": 411.33, "r_x3": 407.42, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69, "r_y0": 419.86, "r_x1": 425.26, "r_y1": 419.86, "r_x2": 425.26, "r_y2": 411.33, "r_x3": 418.69, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.51, "r_y0": 419.86, "r_x1": 436.57, "r_y1": 419.86, "r_x2": 436.57, "r_y2": 411.33, "r_x3": 430.51, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36, "r_y0": 416.17, "r_x1": 175.11, "r_y1": 416.17, "r_x2": 175.11, "r_y2": 409.77, "r_x3": 152.36, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89, "r_y0": 416.17, "r_x1": 191.02, "r_y1": 416.17, "r_x2": 191.02, "r_y2": 409.77, "r_x3": 178.89, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.81, "r_y0": 416.17, "r_x1": 208.83, "r_y1": 416.17, "r_x2": 208.83, "r_y2": 409.77, "r_x3": 194.81, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61, "r_y0": 416.17, "r_x1": 226.26, "r_y1": 416.17, "r_x2": 226.26, "r_y2": 409.77, "r_x3": 212.61, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.38, "r_y0": 416.17, "r_x1": 259.04, "r_y1": 416.17, "r_x2": 259.04, "r_y2": 409.77, "r_x3": 249.38, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.11, "r_x3": 244.46, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.05, "r_y0": 416.17, "r_x1": 245.59, "r_y1": 416.17, "r_x2": 245.59, "r_y2": 409.77, "r_x3": 230.05, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 265.71, "r_x1": 159.62, "r_y1": 265.71, "r_x2": 159.62, "r_y2": 258.6, "r_x3": 154.51, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74, "r_y0": 265.71, "r_x1": 185.22, "r_y1": 265.71, "r_x2": 185.22, "r_y2": 258.6, "r_x3": 164.74, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.35, "r_y0": 273.6, "r_x1": 222.05, "r_y1": 273.6, "r_x2": 222.05, "r_y2": 266.5, "r_x3": 164.35, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15, "r_y0": 273.6, "r_x1": 232.58, "r_y1": 273.6, "r_x2": 232.58, "r_y2": 266.5, "r_x3": 224.15, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 396.41, "t": 280.98, "r": 402.97, "b": 289.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41, "r_y0": 289.51, "r_x1": 402.97, "r_y1": 289.51, "r_x2": 402.97, "r_y2": 280.98, "r_x3": 396.41, "r_y3": 280.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 418.59, "t": 280.9, "r": 425.15, "b": 289.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.59, "r_y0": 289.42, "r_x1": 425.15, "r_y1": 289.42, "r_x2": 425.15, "r_y2": 280.9, "r_x3": 418.59, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 395.75, "t": 303.24, "r": 402.31, "b": 311.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.75, "r_y0": 311.76, "r_x1": 402.31, "r_y1": 311.76, "r_x2": 402.31, "r_y2": 303.24, "r_x3": 395.75, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 407.54, "t": 303.37, "r": 414.1, "b": 311.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.37, "r_x3": 407.54, "r_y3": 303.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 407.56, "t": 314.41, "r": 414.13, "b": 322.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56, "r_y0": 322.93, "r_x1": 414.13, "r_y1": 322.93, "r_x2": 414.13, "r_y2": 314.41, "r_x3": 407.56, "r_y3": 314.41, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 418.51, "t": 292.09, "r": 425.07, "b": 300.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51, "r_y0": 300.61, "r_x1": 425.07, "r_y1": 300.61, "r_x2": 425.07, "r_y2": 292.09, "r_x3": 418.51, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 429.6, "t": 292.09, "r": 436.16, "b": 300.62, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.62, "r_x1": 436.16, "r_y1": 300.62, "r_x2": 436.16, "r_y2": 292.09, "r_x3": 429.6, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 440.69, "t": 292.01, "r": 447.25, "b": 300.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.69, "r_y0": 300.54, "r_x1": 447.25, "r_y1": 300.54, "r_x2": 447.25, "r_y2": 292.01, "r_x3": 440.69, "r_y3": 292.01, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 418.62, "t": 303.29, "r": 425.19, "b": 311.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62, "r_y0": 311.82, "r_x1": 425.19, "r_y1": 311.82, "r_x2": 425.19, "r_y2": 303.29, "r_x3": 418.62, "r_y3": 303.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 429.71, "t": 303.3, "r": 436.27, "b": 311.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 311.83, "r_x1": 436.27, "r_y1": 311.83, "r_x2": 436.27, "r_y2": 303.3, "r_x3": 429.71, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 440.8, "t": 303.22, "r": 447.36, "b": 311.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.75, "r_x1": 447.36, "r_y1": 311.75, "r_x2": 447.36, "r_y2": 303.22, "r_x3": 440.8, "r_y3": 303.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 418.63, "t": 314.57, "r": 425.19, "b": 323.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.63, "r_y0": 323.09, "r_x1": 425.19, "r_y1": 323.09, "r_x2": 425.19, "r_y2": 314.57, "r_x3": 418.63, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 429.71, "t": 314.57, "r": 436.27, "b": 323.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 323.1, "r_x1": 436.27, "r_y1": 323.1, "r_x2": 436.27, "r_y2": 314.57, "r_x3": 429.71, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 440.8, "t": 314.5, "r": 447.36, "b": 323.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.02, "r_x1": 447.36, "r_y1": 323.02, "r_x2": 447.36, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 407.4, "t": 325.29, "r": 413.96, "b": 333.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.82, "r_x1": 413.96, "r_y1": 333.82, "r_x2": 413.96, "r_y2": 325.29, "r_x3": 407.4, "r_y3": 325.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 418.46, "t": 325.45, "r": 425.02, "b": 333.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.46, "r_y0": 333.98, "r_x1": 425.02, "r_y1": 333.98, "r_x2": 425.02, "r_y2": 325.45, "r_x3": 418.46, "r_y3": 325.45, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 429.55, "t": 325.46, "r": 436.11, "b": 333.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.55, "r_y0": 333.98, "r_x1": 436.11, "r_y1": 333.98, "r_x2": 436.11, "r_y2": 325.46, "r_x3": 429.55, "r_y3": 325.46, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 440.64, "t": 325.38, "r": 447.2, "b": 333.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.64, "r_y0": 333.91, "r_x1": 447.2, "r_y1": 333.91, "r_x2": 447.2, "r_y2": 325.38, "r_x3": 440.64, "r_y3": 325.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 451.9, "t": 280.16, "r": 463.51, "b": 288.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.68, "r_x1": 463.51, "r_y1": 288.68, "r_x2": 463.51, "r_y2": 280.16, "r_x3": 451.9, "r_y3": 280.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 452.16, "t": 291.6, "r": 463.77, "b": 300.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.16, "r_y0": 300.12, "r_x1": 463.77, "r_y1": 300.12, "r_x2": 463.77, "r_y2": 291.6, "r_x3": 452.16, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 452.18, "t": 302.84, "r": 463.79, "b": 311.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.18, "r_y0": 311.37, "r_x1": 463.79, "r_y1": 311.37, "r_x2": 463.79, "r_y2": 302.84, "r_x3": 452.18, "r_y3": 302.84, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 452.1, "t": 314.12, "r": 463.72, "b": 322.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.65, "r_x1": 463.72, "r_y1": 322.65, "r_x2": 463.72, "r_y2": 314.12, "r_x3": 452.1, "r_y3": 314.12, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 452.3, "t": 325.47, "r": 463.91, "b": 333.99, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 333.99, "r_x1": 463.91, "r_y1": 333.99, "r_x2": 463.91, "r_y2": 325.47, "r_x3": 452.3, "r_y3": 325.47, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 396.1, "t": 314.49, "r": 402.66, "b": 323.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.02, "r_x1": 402.66, "r_y1": 323.02, "r_x2": 402.66, "r_y2": 314.49, "r_x3": 396.1, "r_y3": 314.49, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 396.0, "t": 325.39, "r": 402.56, "b": 333.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.91, "r_x1": 402.56, "r_y1": 333.91, "r_x2": 402.56, "r_y2": 325.39, "r_x3": 396.0, "r_y3": 325.39, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.27, "t": 292.27, "r": 402.84, "b": 300.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 300.8, "r_x1": 402.84, "r_y1": 300.8, "r_x2": 402.84, "r_y2": 292.27, "r_x3": 396.27, "r_y3": 292.27, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 408.55, "t": 280.97, "r": 413.6, "b": 289.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.55, "r_y0": 289.49, "r_x1": 413.6, "r_y1": 289.49, "r_x2": 413.6, "r_y2": 280.97, "r_x3": 408.55, "r_y3": 280.97, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 430.59, "t": 280.5, "r": 435.64, "b": 289.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.59, "r_y0": 289.02, "r_x1": 435.64, "r_y1": 289.02, "r_x2": 435.64, "r_y2": 280.5, "r_x3": 430.59, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 441.08, "t": 280.38, "r": 446.13, "b": 288.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08, "r_y0": 288.91, "r_x1": 446.13, "r_y1": 288.91, "r_x2": 446.13, "r_y2": 280.38, "r_x3": 441.08, "r_y3": 280.38, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 407.97, "t": 292.13, "r": 414.04, "b": 300.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97, "r_y0": 300.66, "r_x1": 414.04, "r_y1": 300.66, "r_x2": 414.04, "r_y2": 292.13, "r_x3": 407.97, "r_y3": 292.13, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 441.26, "t": 411.18, "r": 452.87, "b": 419.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.26, "r_y0": 419.71, "r_x1": 452.87, "r_y1": 419.71, "r_x2": 452.87, "r_y2": 411.18, "r_x3": 441.26, "r_y3": 411.18, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 393.75, "t": 399.79, "r": 432.49, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 406.9, "r_x1": 432.49, "r_y1": 406.9, "r_x2": 432.49, "r_y2": 399.79, "r_x3": 393.75, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 434.59, "t": 399.79, "r": 438.8, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.59, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.79, "r_x3": 434.59, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 440.91, "t": 399.79, "r": 463.22, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.91, "r_y0": 406.9, "r_x1": 463.22, "r_y1": 406.9, "r_x2": 463.22, "r_y2": 399.79, "r_x3": 440.91, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 384.12, "t": 258.55, "r": 413.99, "b": 265.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.12, "r_y0": 265.65, "r_x1": 413.99, "r_y1": 265.65, "r_x2": 413.99, "r_y2": 258.55, "r_x3": 384.12, "r_y3": 258.55, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 393.75, "t": 266.68, "r": 451.45, "b": 273.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 273.78, "r_x1": 451.45, "r_y1": 273.78, "r_x2": 451.45, "r_y2": 266.68, "r_x3": 393.75, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 453.55, "t": 266.68, "r": 461.97, "b": 273.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55, "r_y0": 273.78, "r_x1": 461.97, "r_y1": 273.78, "r_x2": 461.97, "r_y2": 266.68, "r_x3": 453.55, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 151.79, "t": 399.76, "r": 233.89, "b": 406.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79, "r_y0": 406.86, "r_x1": 233.89, "r_y1": 406.86, "r_x2": 233.89, "r_y2": 399.76, "r_x3": 151.79, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 235.99, "t": 399.76, "r": 244.42, "b": 406.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99, "r_y0": 406.86, "r_x1": 244.42, "r_y1": 406.86, "r_x2": 244.42, "r_y2": 399.76, "r_x3": 235.99, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 246.52, "t": 399.76, "r": 268.84, "b": 406.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52, "r_y0": 406.86, "r_x1": 268.84, "r_y1": 406.86, "r_x2": 268.84, "r_y2": 399.76, "r_x3": 246.52, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 154.33, "t": 213.57, "r": 159.8, "b": 220.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.33, "r_y0": 220.68, "r_x1": 159.8, "r_y1": 220.68, "r_x2": 159.8, "r_y2": 213.57, "r_x3": 154.33, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 321.07, "t": 213.57, "r": 326.54, "b": 220.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07, "r_y0": 220.68, "r_x1": 326.54, "r_y1": 220.68, "r_x2": 326.54, "r_y2": 213.57, "r_x3": 321.07, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 153.09, "t": 280.3, "r": 175.84, "b": 286.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 286.7, "r_x1": 175.84, "r_y1": 286.7, "r_x2": 175.84, "r_y2": 280.3, "r_x3": 153.09, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 160.67, "t": 287.12, "r": 172.8, "b": 293.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 293.52, "r_x1": 172.8, "r_y1": 293.52, "r_x2": 172.8, "r_y2": 287.12, "r_x3": 160.67, "r_y3": 287.12, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 168.25, "t": 293.94, "r": 177.91, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 300.33, "r_x1": 177.91, "r_y1": 300.33, "r_x2": 177.91, "r_y2": 293.94, "r_x3": 168.25, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 263.36, "t": 293.94, "r": 278.9, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.36, "r_y0": 300.33, "r_x1": 278.9, "r_y1": 300.33, "r_x2": 278.9, "r_y2": 293.94, "r_x3": 263.36, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 280.79, "t": 293.94, "r": 290.46, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79, "r_y0": 300.33, "r_x1": 290.46, "r_y1": 300.33, "r_x2": 290.46, "r_y2": 293.94, "r_x3": 280.79, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 335.93, "t": 293.94, "r": 351.47, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.93, "r_y0": 300.33, "r_x1": 351.47, "r_y1": 300.33, "r_x2": 351.47, "r_y2": 293.94, "r_x3": 335.93, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 160.67, "t": 300.75, "r": 174.69, "b": 307.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 307.15, "r_x1": 174.69, "r_y1": 307.15, "r_x2": 174.69, "r_y2": 300.75, "r_x3": 160.67, "r_y3": 300.75, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 160.67, "t": 307.57, "r": 172.8, "b": 313.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 313.97, "r_x1": 172.8, "r_y1": 313.97, "r_x2": 172.8, "r_y2": 307.57, "r_x3": 160.67, "r_y3": 307.57, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 168.25, "t": 314.39, "r": 181.89, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 320.78, "r_x1": 181.89, "r_y1": 320.78, "r_x2": 181.89, "r_y2": 314.39, "r_x3": 168.25, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 201.22, "t": 314.39, "r": 214.87, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 320.78, "r_x1": 214.87, "r_y1": 320.78, "r_x2": 214.87, "r_y2": 314.39, "r_x3": 201.22, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 234.19, "t": 314.39, "r": 247.84, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 320.78, "r_x1": 247.84, "r_y1": 320.78, "r_x2": 247.84, "r_y2": 314.39, "r_x3": 234.19, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 160.67, "t": 321.2, "r": 174.69, "b": 327.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 327.6, "r_x1": 174.69, "r_y1": 327.6, "r_x2": 174.69, "r_y2": 321.2, "r_x3": 160.67, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 160.67, "t": 328.02, "r": 172.8, "b": 334.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 334.42, "r_x1": 172.8, "r_y1": 334.42, "r_x2": 172.8, "r_y2": 328.02, "r_x3": 160.67, "r_y3": 328.02, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 168.25, "t": 334.84, "r": 373.09, "b": 341.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 341.23, "r_x1": 373.09, "r_y1": 341.23, "r_x2": 373.09, "r_y2": 334.84, "r_x3": 168.25, "r_y3": 334.84, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 160.67, "t": 341.66, "r": 174.69, "b": 348.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 348.05, "r_x1": 174.69, "r_y1": 348.05, "r_x2": 174.69, "r_y2": 341.66, "r_x3": 160.67, "r_y3": 341.66, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 160.67, "t": 348.47, "r": 172.8, "b": 354.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 354.87, "r_x1": 172.8, "r_y1": 354.87, "r_x2": 172.8, "r_y2": 348.47, "r_x3": 160.67, "r_y3": 348.47, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 168.25, "t": 355.29, "r": 181.89, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 361.68, "r_x1": 181.89, "r_y1": 361.68, "r_x2": 181.89, "r_y2": 355.29, "r_x3": 168.25, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 201.22, "t": 355.29, "r": 214.87, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 361.68, "r_x1": 214.87, "r_y1": 361.68, "r_x2": 214.87, "r_y2": 355.29, "r_x3": 201.22, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 234.19, "t": 355.29, "r": 247.84, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 361.68, "r_x1": 247.84, "r_y1": 361.68, "r_x2": 247.84, "r_y2": 355.29, "r_x3": 234.19, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 267.17, "t": 355.29, "r": 280.81, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 361.68, "r_x1": 280.81, "r_y1": 361.68, "r_x2": 280.81, "r_y2": 355.29, "r_x3": 267.17, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 160.67, "t": 362.11, "r": 174.69, "b": 368.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 368.5, "r_x1": 174.69, "r_y1": 368.5, "r_x2": 174.69, "r_y2": 362.11, "r_x3": 160.67, "r_y3": 362.11, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 160.67, "t": 368.92, "r": 172.8, "b": 375.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 375.32, "r_x1": 172.8, "r_y1": 375.32, "r_x2": 172.8, "r_y2": 368.92, "r_x3": 160.67, "r_y3": 368.92, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 168.25, "t": 375.74, "r": 181.89, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 382.13, "r_x1": 181.89, "r_y1": 382.13, "r_x2": 181.89, "r_y2": 375.74, "r_x3": 168.25, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 201.22, "t": 375.74, "r": 214.87, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 382.13, "r_x1": 214.87, "r_y1": 382.13, "r_x2": 214.87, "r_y2": 375.74, "r_x3": 201.22, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 234.19, "t": 375.74, "r": 247.84, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 382.13, "r_x1": 247.84, "r_y1": 382.13, "r_x2": 247.84, "r_y2": 375.74, "r_x3": 234.19, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 267.17, "t": 375.74, "r": 280.81, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 382.13, "r_x1": 280.81, "r_y1": 382.13, "r_x2": 280.81, "r_y2": 375.74, "r_x3": 267.17, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 160.67, "t": 382.56, "r": 174.69, "b": 388.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 388.95, "r_x1": 174.69, "r_y1": 388.95, "r_x2": 174.69, "r_y2": 382.56, "r_x3": 160.67, "r_y3": 382.56, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 153.09, "t": 389.37, "r": 177.73, "b": 395.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 395.77, "r_x1": 177.73, "r_y1": 395.77, "r_x2": 177.73, "r_y2": 389.37, "r_x3": 153.09, "r_y3": 389.37, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.79, "t": 314.39, "r": 199.33, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 320.78, "r_x1": 199.33, "r_y1": 320.78, "r_x2": 199.33, "r_y2": 314.39, "r_x3": 183.79, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 216.76, "t": 314.39, "r": 232.3, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 320.78, "r_x1": 232.3, "r_y1": 320.78, "r_x2": 232.3, "r_y2": 314.39, "r_x3": 216.76, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 249.73, "t": 314.39, "r": 265.27, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 320.78, "r_x1": 265.27, "r_y1": 320.78, "r_x2": 265.27, "r_y2": 314.39, "r_x3": 249.73, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 183.79, "t": 355.29, "r": 199.33, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 361.68, "r_x1": 199.33, "r_y1": 361.68, "r_x2": 199.33, "r_y2": 355.29, "r_x3": 183.79, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 216.76, "t": 355.29, "r": 232.3, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 361.68, "r_x1": 232.3, "r_y1": 361.68, "r_x2": 232.3, "r_y2": 355.29, "r_x3": 216.76, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 249.73, "t": 355.29, "r": 265.27, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 361.68, "r_x1": 265.27, "r_y1": 361.68, "r_x2": 265.27, "r_y2": 355.29, "r_x3": 249.73, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 282.71, "t": 355.29, "r": 298.25, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 361.68, "r_x1": 298.25, "r_y1": 361.68, "r_x2": 298.25, "r_y2": 355.29, "r_x3": 282.71, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.79, "t": 375.74, "r": 199.33, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 382.13, "r_x1": 199.33, "r_y1": 382.13, "r_x2": 199.33, "r_y2": 375.74, "r_x3": 183.79, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 216.76, "t": 375.74, "r": 232.3, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 382.13, "r_x1": 232.3, "r_y1": 382.13, "r_x2": 232.3, "r_y2": 375.74, "r_x3": 216.76, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 249.73, "t": 375.74, "r": 265.27, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 382.13, "r_x1": 265.27, "r_y1": 382.13, "r_x2": 265.27, "r_y2": 375.74, "r_x3": 249.73, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 282.71, "t": 375.74, "r": 298.25, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 382.13, "r_x1": 298.25, "r_y1": 382.13, "r_x2": 298.25, "r_y2": 375.74, "r_x3": 282.71, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 395.06, "t": 411.33, "r": 401.62, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06, "r_y0": 419.86, "r_x1": 401.62, "r_y1": 419.86, "r_x2": 401.62, "r_y2": 411.33, "r_x3": 395.06, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 407.42, "t": 411.33, "r": 412.48, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 419.86, "r_x1": 412.48, "r_y1": 419.86, "r_x2": 412.48, "r_y2": 411.33, "r_x3": 407.42, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 418.69, "t": 411.33, "r": 425.26, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69, "r_y0": 419.86, "r_x1": 425.26, "r_y1": 419.86, "r_x2": 425.26, "r_y2": 411.33, "r_x3": 418.69, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 430.51, "t": 411.33, "r": 436.57, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.51, "r_y0": 419.86, "r_x1": 436.57, "r_y1": 419.86, "r_x2": 436.57, "r_y2": 411.33, "r_x3": 430.51, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 152.36, "t": 409.77, "r": 175.11, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36, "r_y0": 416.17, "r_x1": 175.11, "r_y1": 416.17, "r_x2": 175.11, "r_y2": 409.77, "r_x3": 152.36, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 178.89, "t": 409.77, "r": 191.02, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89, "r_y0": 416.17, "r_x1": 191.02, "r_y1": 416.17, "r_x2": 191.02, "r_y2": 409.77, "r_x3": 178.89, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 194.81, "t": 409.77, "r": 208.83, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.81, "r_y0": 416.17, "r_x1": 208.83, "r_y1": 416.17, "r_x2": 208.83, "r_y2": 409.77, "r_x3": 194.81, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 212.61, "t": 409.77, "r": 226.26, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61, "r_y0": 416.17, "r_x1": 226.26, "r_y1": 416.17, "r_x2": 226.26, "r_y2": 409.77, "r_x3": 212.61, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 249.38, "t": 409.77, "r": 259.04, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.38, "r_y0": 416.17, "r_x1": 259.04, "r_y1": 416.17, "r_x2": 259.04, "r_y2": 409.77, "r_x3": 249.38, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 244.46, "t": 418.11, "r": 269.1, "b": 424.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.11, "r_x3": 244.46, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 230.05, "t": 409.77, "r": 245.59, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.05, "r_y0": 416.17, "r_x1": 245.59, "r_y1": 416.17, "r_x2": 245.59, "r_y2": 409.77, "r_x3": 230.05, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 154.51, "t": 258.6, "r": 159.62, "b": 265.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 265.71, "r_x1": 159.62, "r_y1": 265.71, "r_x2": 159.62, "r_y2": 258.6, "r_x3": 154.51, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 164.74, "t": 258.6, "r": 185.22, "b": 265.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74, "r_y0": 265.71, "r_x1": 185.22, "r_y1": 265.71, "r_x2": 185.22, "r_y2": 258.6, "r_x3": 164.74, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 164.35, "t": 266.5, "r": 222.05, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.35, "r_y0": 273.6, "r_x1": 222.05, "r_y1": 273.6, "r_x2": 222.05, "r_y2": 266.5, "r_x3": 164.35, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 224.15, "t": 266.5, "r": 232.58, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15, "r_y0": 273.6, "r_x1": 232.58, "r_y1": 273.6, "r_x2": 232.58, "r_y2": 266.5, "r_x3": 224.15, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 452.31, "r": 480.59, "b": 520.89, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 461.11, "r_x1": 161.33, "r_y1": 461.11, "r_x2": 161.33, "r_y2": 452.31, "r_x3": 134.76, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.27, "r_y0": 461.11, "r_x1": 226.29, "r_y1": 461.11, "r_x2": 226.29, "r_y2": 452.31, "r_x3": 164.27, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.99, "r_y0": 461.11, "r_x1": 480.59, "r_y1": 461.11, "r_x2": 480.59, "r_y2": 452.31, "r_x3": 229.99, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 473.07, "r_x1": 480.59, "r_y1": 473.07, "r_x2": 480.59, "r_y2": 464.27, "r_x3": 134.77, "r_y3": 464.27, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 485.02, "r_x1": 480.59, "r_y1": 485.02, "r_x2": 480.59, "r_y2": 476.22, "r_x3": 134.77, "r_y3": 476.22, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 496.98, "r_x1": 480.59, "r_y1": 496.98, "r_x2": 480.59, "r_y2": 488.18, "r_x3": 134.77, "r_y3": 488.18, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 508.93, "r_x1": 480.59, "r_y1": 508.93, "r_x2": 480.59, "r_y2": 500.13, "r_x3": 134.77, "r_y3": 500.13, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 520.89, "r_x1": 313.25, "r_y1": 520.89, "r_x2": 313.25, "r_y2": 512.09, "r_x3": 134.77, "r_y3": 512.09, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.77, "t": 524.55, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 149.71, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.77, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.77, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.77, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.77, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.33, "r_x3": 134.77, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.77, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.77, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.77, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.77, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 421.45, "r_y1": 664.85, "r_x2": 421.45, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.858, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" }, { "label": "page_header", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.908, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "caption", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.76, "t": 126.33, "r": 480.59, "b": 200.22, "coord_origin": "TOPLEFT" }, "confidence": 0.894, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 134.26, "r_x1": 162.64, "r_y1": 134.26, "r_x2": 162.64, "r_y2": 126.33, "r_x3": 134.76, "r_y3": 126.33, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.06, "r_y0": 134.47, "r_x1": 480.59, "r_y1": 134.47, "r_x2": 480.59, "r_y2": 126.4, "r_x3": 167.06, "r_y3": 126.4, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 145.43, "r_x1": 480.59, "r_y1": 145.43, "r_x2": 480.59, "r_y2": 137.36, "r_x3": 134.76, "r_y3": 137.36, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 156.38, "r_x1": 147.95, "r_y1": 156.38, "r_x2": 147.95, "r_y2": 148.31, "r_x3": 134.76, "r_y3": 148.31, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.39, "r_y0": 156.38, "r_x1": 480.59, "r_y1": 156.38, "r_x2": 480.59, "r_y2": 148.31, "r_x3": 152.39, "r_y3": 148.31, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 167.34, "r_x1": 480.59, "r_y1": 167.34, "r_x2": 480.59, "r_y2": 159.27, "r_x3": 134.76, "r_y3": 159.27, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 178.3, "r_x1": 480.59, "r_y1": 178.3, "r_x2": 480.59, "r_y2": 170.23, "r_x3": 134.76, "r_y3": 170.23, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 189.26, "r_x1": 480.59, "r_y1": 189.26, "r_x2": 480.59, "r_y2": 181.19, "r_x3": 134.76, "r_y3": 181.19, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 200.22, "r_x1": 460.87, "r_y1": 200.22, "r_x2": 460.87, "r_y2": 192.15, "r_x3": 134.76, "r_y3": 192.15, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 1. Comparison between HTML and OTSL table structure representation: (A) table-example with complex row and column headers, including a 2D empty span, (B) minimal graphical representation of table structure using rectangular layout, (C) HTML representation, (D) OTSL representation. This example demonstrates many of the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case), its reduced sequence length (55 versus 30) and a enhanced internal structure (variable token sequence length per row in HTML versus a fixed length of rows in OTSL)." }, { "label": "picture", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "picture", "bbox": { "l": 148.45, "t": 208.37, "r": 464.36, "b": 425.85, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41, "r_y0": 289.51, "r_x1": 402.97, "r_y1": 289.51, "r_x2": 402.97, "r_y2": 280.98, "r_x3": 396.41, "r_y3": 280.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.59, "r_y0": 289.42, "r_x1": 425.15, "r_y1": 289.42, "r_x2": 425.15, "r_y2": 280.9, "r_x3": 418.59, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.75, "r_y0": 311.76, "r_x1": 402.31, "r_y1": 311.76, "r_x2": 402.31, "r_y2": 303.24, "r_x3": 395.75, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.37, "r_x3": 407.54, "r_y3": 303.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56, "r_y0": 322.93, "r_x1": 414.13, "r_y1": 322.93, "r_x2": 414.13, "r_y2": 314.41, "r_x3": 407.56, "r_y3": 314.41, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51, "r_y0": 300.61, "r_x1": 425.07, "r_y1": 300.61, "r_x2": 425.07, "r_y2": 292.09, "r_x3": 418.51, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.62, "r_x1": 436.16, "r_y1": 300.62, "r_x2": 436.16, "r_y2": 292.09, "r_x3": 429.6, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.69, "r_y0": 300.54, "r_x1": 447.25, "r_y1": 300.54, "r_x2": 447.25, "r_y2": 292.01, "r_x3": 440.69, "r_y3": 292.01, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62, "r_y0": 311.82, "r_x1": 425.19, "r_y1": 311.82, "r_x2": 425.19, "r_y2": 303.29, "r_x3": 418.62, "r_y3": 303.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 311.83, "r_x1": 436.27, "r_y1": 311.83, "r_x2": 436.27, "r_y2": 303.3, "r_x3": 429.71, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.75, "r_x1": 447.36, "r_y1": 311.75, "r_x2": 447.36, "r_y2": 303.22, "r_x3": 440.8, "r_y3": 303.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.63, "r_y0": 323.09, "r_x1": 425.19, "r_y1": 323.09, "r_x2": 425.19, "r_y2": 314.57, "r_x3": 418.63, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 323.1, "r_x1": 436.27, "r_y1": 323.1, "r_x2": 436.27, "r_y2": 314.57, "r_x3": 429.71, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.02, "r_x1": 447.36, "r_y1": 323.02, "r_x2": 447.36, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.82, "r_x1": 413.96, "r_y1": 333.82, "r_x2": 413.96, "r_y2": 325.29, "r_x3": 407.4, "r_y3": 325.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.46, "r_y0": 333.98, "r_x1": 425.02, "r_y1": 333.98, "r_x2": 425.02, "r_y2": 325.45, "r_x3": 418.46, "r_y3": 325.45, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.55, "r_y0": 333.98, "r_x1": 436.11, "r_y1": 333.98, "r_x2": 436.11, "r_y2": 325.46, "r_x3": 429.55, "r_y3": 325.46, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.64, "r_y0": 333.91, "r_x1": 447.2, "r_y1": 333.91, "r_x2": 447.2, "r_y2": 325.38, "r_x3": 440.64, "r_y3": 325.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.68, "r_x1": 463.51, "r_y1": 288.68, "r_x2": 463.51, "r_y2": 280.16, "r_x3": 451.9, "r_y3": 280.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.16, "r_y0": 300.12, "r_x1": 463.77, "r_y1": 300.12, "r_x2": 463.77, "r_y2": 291.6, "r_x3": 452.16, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.18, "r_y0": 311.37, "r_x1": 463.79, "r_y1": 311.37, "r_x2": 463.79, "r_y2": 302.84, "r_x3": 452.18, "r_y3": 302.84, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.65, "r_x1": 463.72, "r_y1": 322.65, "r_x2": 463.72, "r_y2": 314.12, "r_x3": 452.1, "r_y3": 314.12, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 333.99, "r_x1": 463.91, "r_y1": 333.99, "r_x2": 463.91, "r_y2": 325.47, "r_x3": 452.3, "r_y3": 325.47, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.02, "r_x1": 402.66, "r_y1": 323.02, "r_x2": 402.66, "r_y2": 314.49, "r_x3": 396.1, "r_y3": 314.49, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.91, "r_x1": 402.56, "r_y1": 333.91, "r_x2": 402.56, "r_y2": 325.39, "r_x3": 396.0, "r_y3": 325.39, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 300.8, "r_x1": 402.84, "r_y1": 300.8, "r_x2": 402.84, "r_y2": 292.27, "r_x3": 396.27, "r_y3": 292.27, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.55, "r_y0": 289.49, "r_x1": 413.6, "r_y1": 289.49, "r_x2": 413.6, "r_y2": 280.97, "r_x3": 408.55, "r_y3": 280.97, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.59, "r_y0": 289.02, "r_x1": 435.64, "r_y1": 289.02, "r_x2": 435.64, "r_y2": 280.5, "r_x3": 430.59, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08, "r_y0": 288.91, "r_x1": 446.13, "r_y1": 288.91, "r_x2": 446.13, "r_y2": 280.38, "r_x3": 441.08, "r_y3": 280.38, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97, "r_y0": 300.66, "r_x1": 414.04, "r_y1": 300.66, "r_x2": 414.04, "r_y2": 292.13, "r_x3": 407.97, "r_y3": 292.13, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.26, "r_y0": 419.71, "r_x1": 452.87, "r_y1": 419.71, "r_x2": 452.87, "r_y2": 411.18, "r_x3": 441.26, "r_y3": 411.18, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 406.9, "r_x1": 432.49, "r_y1": 406.9, "r_x2": 432.49, "r_y2": 399.79, "r_x3": 393.75, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.59, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.79, "r_x3": 434.59, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.91, "r_y0": 406.9, "r_x1": 463.22, "r_y1": 406.9, "r_x2": 463.22, "r_y2": 399.79, "r_x3": 440.91, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.12, "r_y0": 265.65, "r_x1": 413.99, "r_y1": 265.65, "r_x2": 413.99, "r_y2": 258.55, "r_x3": 384.12, "r_y3": 258.55, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 273.78, "r_x1": 451.45, "r_y1": 273.78, "r_x2": 451.45, "r_y2": 266.68, "r_x3": 393.75, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55, "r_y0": 273.78, "r_x1": 461.97, "r_y1": 273.78, "r_x2": 461.97, "r_y2": 266.68, "r_x3": 453.55, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79, "r_y0": 406.86, "r_x1": 233.89, "r_y1": 406.86, "r_x2": 233.89, "r_y2": 399.76, "r_x3": 151.79, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99, "r_y0": 406.86, "r_x1": 244.42, "r_y1": 406.86, "r_x2": 244.42, "r_y2": 399.76, "r_x3": 235.99, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52, "r_y0": 406.86, "r_x1": 268.84, "r_y1": 406.86, "r_x2": 268.84, "r_y2": 399.76, "r_x3": 246.52, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.33, "r_y0": 220.68, "r_x1": 159.8, "r_y1": 220.68, "r_x2": 159.8, "r_y2": 213.57, "r_x3": 154.33, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07, "r_y0": 220.68, "r_x1": 326.54, "r_y1": 220.68, "r_x2": 326.54, "r_y2": 213.57, "r_x3": 321.07, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 286.7, "r_x1": 175.84, "r_y1": 286.7, "r_x2": 175.84, "r_y2": 280.3, "r_x3": 153.09, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 293.52, "r_x1": 172.8, "r_y1": 293.52, "r_x2": 172.8, "r_y2": 287.12, "r_x3": 160.67, "r_y3": 287.12, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 300.33, "r_x1": 177.91, "r_y1": 300.33, "r_x2": 177.91, "r_y2": 293.94, "r_x3": 168.25, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.36, "r_y0": 300.33, "r_x1": 278.9, "r_y1": 300.33, "r_x2": 278.9, "r_y2": 293.94, "r_x3": 263.36, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79, "r_y0": 300.33, "r_x1": 290.46, "r_y1": 300.33, "r_x2": 290.46, "r_y2": 293.94, "r_x3": 280.79, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.93, "r_y0": 300.33, "r_x1": 351.47, "r_y1": 300.33, "r_x2": 351.47, "r_y2": 293.94, "r_x3": 335.93, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 307.15, "r_x1": 174.69, "r_y1": 307.15, "r_x2": 174.69, "r_y2": 300.75, "r_x3": 160.67, "r_y3": 300.75, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 313.97, "r_x1": 172.8, "r_y1": 313.97, "r_x2": 172.8, "r_y2": 307.57, "r_x3": 160.67, "r_y3": 307.57, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 320.78, "r_x1": 181.89, "r_y1": 320.78, "r_x2": 181.89, "r_y2": 314.39, "r_x3": 168.25, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 320.78, "r_x1": 214.87, "r_y1": 320.78, "r_x2": 214.87, "r_y2": 314.39, "r_x3": 201.22, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 320.78, "r_x1": 247.84, "r_y1": 320.78, "r_x2": 247.84, "r_y2": 314.39, "r_x3": 234.19, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 327.6, "r_x1": 174.69, "r_y1": 327.6, "r_x2": 174.69, "r_y2": 321.2, "r_x3": 160.67, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 334.42, "r_x1": 172.8, "r_y1": 334.42, "r_x2": 172.8, "r_y2": 328.02, "r_x3": 160.67, "r_y3": 328.02, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 341.23, "r_x1": 373.09, "r_y1": 341.23, "r_x2": 373.09, "r_y2": 334.84, "r_x3": 168.25, "r_y3": 334.84, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 348.05, "r_x1": 174.69, "r_y1": 348.05, "r_x2": 174.69, "r_y2": 341.66, "r_x3": 160.67, "r_y3": 341.66, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 354.87, "r_x1": 172.8, "r_y1": 354.87, "r_x2": 172.8, "r_y2": 348.47, "r_x3": 160.67, "r_y3": 348.47, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 361.68, "r_x1": 181.89, "r_y1": 361.68, "r_x2": 181.89, "r_y2": 355.29, "r_x3": 168.25, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 361.68, "r_x1": 214.87, "r_y1": 361.68, "r_x2": 214.87, "r_y2": 355.29, "r_x3": 201.22, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 361.68, "r_x1": 247.84, "r_y1": 361.68, "r_x2": 247.84, "r_y2": 355.29, "r_x3": 234.19, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 361.68, "r_x1": 280.81, "r_y1": 361.68, "r_x2": 280.81, "r_y2": 355.29, "r_x3": 267.17, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 368.5, "r_x1": 174.69, "r_y1": 368.5, "r_x2": 174.69, "r_y2": 362.11, "r_x3": 160.67, "r_y3": 362.11, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 375.32, "r_x1": 172.8, "r_y1": 375.32, "r_x2": 172.8, "r_y2": 368.92, "r_x3": 160.67, "r_y3": 368.92, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 382.13, "r_x1": 181.89, "r_y1": 382.13, "r_x2": 181.89, "r_y2": 375.74, "r_x3": 168.25, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 382.13, "r_x1": 214.87, "r_y1": 382.13, "r_x2": 214.87, "r_y2": 375.74, "r_x3": 201.22, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 382.13, "r_x1": 247.84, "r_y1": 382.13, "r_x2": 247.84, "r_y2": 375.74, "r_x3": 234.19, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 382.13, "r_x1": 280.81, "r_y1": 382.13, "r_x2": 280.81, "r_y2": 375.74, "r_x3": 267.17, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 388.95, "r_x1": 174.69, "r_y1": 388.95, "r_x2": 174.69, "r_y2": 382.56, "r_x3": 160.67, "r_y3": 382.56, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 395.77, "r_x1": 177.73, "r_y1": 395.77, "r_x2": 177.73, "r_y2": 389.37, "r_x3": 153.09, "r_y3": 389.37, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 320.78, "r_x1": 199.33, "r_y1": 320.78, "r_x2": 199.33, "r_y2": 314.39, "r_x3": 183.79, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 320.78, "r_x1": 232.3, "r_y1": 320.78, "r_x2": 232.3, "r_y2": 314.39, "r_x3": 216.76, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 320.78, "r_x1": 265.27, "r_y1": 320.78, "r_x2": 265.27, "r_y2": 314.39, "r_x3": 249.73, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 361.68, "r_x1": 199.33, "r_y1": 361.68, "r_x2": 199.33, "r_y2": 355.29, "r_x3": 183.79, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 361.68, "r_x1": 232.3, "r_y1": 361.68, "r_x2": 232.3, "r_y2": 355.29, "r_x3": 216.76, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 361.68, "r_x1": 265.27, "r_y1": 361.68, "r_x2": 265.27, "r_y2": 355.29, "r_x3": 249.73, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 361.68, "r_x1": 298.25, "r_y1": 361.68, "r_x2": 298.25, "r_y2": 355.29, "r_x3": 282.71, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 382.13, "r_x1": 199.33, "r_y1": 382.13, "r_x2": 199.33, "r_y2": 375.74, "r_x3": 183.79, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 382.13, "r_x1": 232.3, "r_y1": 382.13, "r_x2": 232.3, "r_y2": 375.74, "r_x3": 216.76, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 382.13, "r_x1": 265.27, "r_y1": 382.13, "r_x2": 265.27, "r_y2": 375.74, "r_x3": 249.73, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 382.13, "r_x1": 298.25, "r_y1": 382.13, "r_x2": 298.25, "r_y2": 375.74, "r_x3": 282.71, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06, "r_y0": 419.86, "r_x1": 401.62, "r_y1": 419.86, "r_x2": 401.62, "r_y2": 411.33, "r_x3": 395.06, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 419.86, "r_x1": 412.48, "r_y1": 419.86, "r_x2": 412.48, "r_y2": 411.33, "r_x3": 407.42, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69, "r_y0": 419.86, "r_x1": 425.26, "r_y1": 419.86, "r_x2": 425.26, "r_y2": 411.33, "r_x3": 418.69, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.51, "r_y0": 419.86, "r_x1": 436.57, "r_y1": 419.86, "r_x2": 436.57, "r_y2": 411.33, "r_x3": 430.51, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36, "r_y0": 416.17, "r_x1": 175.11, "r_y1": 416.17, "r_x2": 175.11, "r_y2": 409.77, "r_x3": 152.36, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89, "r_y0": 416.17, "r_x1": 191.02, "r_y1": 416.17, "r_x2": 191.02, "r_y2": 409.77, "r_x3": 178.89, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.81, "r_y0": 416.17, "r_x1": 208.83, "r_y1": 416.17, "r_x2": 208.83, "r_y2": 409.77, "r_x3": 194.81, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61, "r_y0": 416.17, "r_x1": 226.26, "r_y1": 416.17, "r_x2": 226.26, "r_y2": 409.77, "r_x3": 212.61, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.38, "r_y0": 416.17, "r_x1": 259.04, "r_y1": 416.17, "r_x2": 259.04, "r_y2": 409.77, "r_x3": 249.38, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.11, "r_x3": 244.46, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.05, "r_y0": 416.17, "r_x1": 245.59, "r_y1": 416.17, "r_x2": 245.59, "r_y2": 409.77, "r_x3": 230.05, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 265.71, "r_x1": 159.62, "r_y1": 265.71, "r_x2": 159.62, "r_y2": 258.6, "r_x3": 154.51, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74, "r_y0": 265.71, "r_x1": 185.22, "r_y1": 265.71, "r_x2": 185.22, "r_y2": 258.6, "r_x3": 164.74, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.35, "r_y0": 273.6, "r_x1": 222.05, "r_y1": 273.6, "r_x2": 222.05, "r_y2": 266.5, "r_x3": 164.35, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15, "r_y0": 273.6, "r_x1": 232.58, "r_y1": 273.6, "r_x2": 232.58, "r_y2": 266.5, "r_x3": 224.15, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 396.41, "t": 280.98, "r": 402.97, "b": 289.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41, "r_y0": 289.51, "r_x1": 402.97, "r_y1": 289.51, "r_x2": 402.97, "r_y2": 280.98, "r_x3": 396.41, "r_y3": 280.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 418.59, "t": 280.9, "r": 425.15, "b": 289.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.59, "r_y0": 289.42, "r_x1": 425.15, "r_y1": 289.42, "r_x2": 425.15, "r_y2": 280.9, "r_x3": 418.59, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 395.75, "t": 303.24, "r": 402.31, "b": 311.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.75, "r_y0": 311.76, "r_x1": 402.31, "r_y1": 311.76, "r_x2": 402.31, "r_y2": 303.24, "r_x3": 395.75, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 407.54, "t": 303.37, "r": 414.1, "b": 311.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.37, "r_x3": 407.54, "r_y3": 303.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 407.56, "t": 314.41, "r": 414.13, "b": 322.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56, "r_y0": 322.93, "r_x1": 414.13, "r_y1": 322.93, "r_x2": 414.13, "r_y2": 314.41, "r_x3": 407.56, "r_y3": 314.41, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 418.51, "t": 292.09, "r": 425.07, "b": 300.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51, "r_y0": 300.61, "r_x1": 425.07, "r_y1": 300.61, "r_x2": 425.07, "r_y2": 292.09, "r_x3": 418.51, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 429.6, "t": 292.09, "r": 436.16, "b": 300.62, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.62, "r_x1": 436.16, "r_y1": 300.62, "r_x2": 436.16, "r_y2": 292.09, "r_x3": 429.6, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 440.69, "t": 292.01, "r": 447.25, "b": 300.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.69, "r_y0": 300.54, "r_x1": 447.25, "r_y1": 300.54, "r_x2": 447.25, "r_y2": 292.01, "r_x3": 440.69, "r_y3": 292.01, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 418.62, "t": 303.29, "r": 425.19, "b": 311.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62, "r_y0": 311.82, "r_x1": 425.19, "r_y1": 311.82, "r_x2": 425.19, "r_y2": 303.29, "r_x3": 418.62, "r_y3": 303.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 429.71, "t": 303.3, "r": 436.27, "b": 311.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 311.83, "r_x1": 436.27, "r_y1": 311.83, "r_x2": 436.27, "r_y2": 303.3, "r_x3": 429.71, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 440.8, "t": 303.22, "r": 447.36, "b": 311.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.75, "r_x1": 447.36, "r_y1": 311.75, "r_x2": 447.36, "r_y2": 303.22, "r_x3": 440.8, "r_y3": 303.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 418.63, "t": 314.57, "r": 425.19, "b": 323.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.63, "r_y0": 323.09, "r_x1": 425.19, "r_y1": 323.09, "r_x2": 425.19, "r_y2": 314.57, "r_x3": 418.63, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 429.71, "t": 314.57, "r": 436.27, "b": 323.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 323.1, "r_x1": 436.27, "r_y1": 323.1, "r_x2": 436.27, "r_y2": 314.57, "r_x3": 429.71, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 440.8, "t": 314.5, "r": 447.36, "b": 323.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.02, "r_x1": 447.36, "r_y1": 323.02, "r_x2": 447.36, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 407.4, "t": 325.29, "r": 413.96, "b": 333.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.82, "r_x1": 413.96, "r_y1": 333.82, "r_x2": 413.96, "r_y2": 325.29, "r_x3": 407.4, "r_y3": 325.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 418.46, "t": 325.45, "r": 425.02, "b": 333.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.46, "r_y0": 333.98, "r_x1": 425.02, "r_y1": 333.98, "r_x2": 425.02, "r_y2": 325.45, "r_x3": 418.46, "r_y3": 325.45, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 429.55, "t": 325.46, "r": 436.11, "b": 333.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.55, "r_y0": 333.98, "r_x1": 436.11, "r_y1": 333.98, "r_x2": 436.11, "r_y2": 325.46, "r_x3": 429.55, "r_y3": 325.46, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 440.64, "t": 325.38, "r": 447.2, "b": 333.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.64, "r_y0": 333.91, "r_x1": 447.2, "r_y1": 333.91, "r_x2": 447.2, "r_y2": 325.38, "r_x3": 440.64, "r_y3": 325.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 451.9, "t": 280.16, "r": 463.51, "b": 288.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.68, "r_x1": 463.51, "r_y1": 288.68, "r_x2": 463.51, "r_y2": 280.16, "r_x3": 451.9, "r_y3": 280.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 452.16, "t": 291.6, "r": 463.77, "b": 300.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.16, "r_y0": 300.12, "r_x1": 463.77, "r_y1": 300.12, "r_x2": 463.77, "r_y2": 291.6, "r_x3": 452.16, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 452.18, "t": 302.84, "r": 463.79, "b": 311.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.18, "r_y0": 311.37, "r_x1": 463.79, "r_y1": 311.37, "r_x2": 463.79, "r_y2": 302.84, "r_x3": 452.18, "r_y3": 302.84, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 452.1, "t": 314.12, "r": 463.72, "b": 322.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.65, "r_x1": 463.72, "r_y1": 322.65, "r_x2": 463.72, "r_y2": 314.12, "r_x3": 452.1, "r_y3": 314.12, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 452.3, "t": 325.47, "r": 463.91, "b": 333.99, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 333.99, "r_x1": 463.91, "r_y1": 333.99, "r_x2": 463.91, "r_y2": 325.47, "r_x3": 452.3, "r_y3": 325.47, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 396.1, "t": 314.49, "r": 402.66, "b": 323.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.02, "r_x1": 402.66, "r_y1": 323.02, "r_x2": 402.66, "r_y2": 314.49, "r_x3": 396.1, "r_y3": 314.49, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 396.0, "t": 325.39, "r": 402.56, "b": 333.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.91, "r_x1": 402.56, "r_y1": 333.91, "r_x2": 402.56, "r_y2": 325.39, "r_x3": 396.0, "r_y3": 325.39, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.27, "t": 292.27, "r": 402.84, "b": 300.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 300.8, "r_x1": 402.84, "r_y1": 300.8, "r_x2": 402.84, "r_y2": 292.27, "r_x3": 396.27, "r_y3": 292.27, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 408.55, "t": 280.97, "r": 413.6, "b": 289.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.55, "r_y0": 289.49, "r_x1": 413.6, "r_y1": 289.49, "r_x2": 413.6, "r_y2": 280.97, "r_x3": 408.55, "r_y3": 280.97, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 430.59, "t": 280.5, "r": 435.64, "b": 289.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.59, "r_y0": 289.02, "r_x1": 435.64, "r_y1": 289.02, "r_x2": 435.64, "r_y2": 280.5, "r_x3": 430.59, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 441.08, "t": 280.38, "r": 446.13, "b": 288.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08, "r_y0": 288.91, "r_x1": 446.13, "r_y1": 288.91, "r_x2": 446.13, "r_y2": 280.38, "r_x3": 441.08, "r_y3": 280.38, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 407.97, "t": 292.13, "r": 414.04, "b": 300.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97, "r_y0": 300.66, "r_x1": 414.04, "r_y1": 300.66, "r_x2": 414.04, "r_y2": 292.13, "r_x3": 407.97, "r_y3": 292.13, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 441.26, "t": 411.18, "r": 452.87, "b": 419.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.26, "r_y0": 419.71, "r_x1": 452.87, "r_y1": 419.71, "r_x2": 452.87, "r_y2": 411.18, "r_x3": 441.26, "r_y3": 411.18, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 393.75, "t": 399.79, "r": 432.49, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 406.9, "r_x1": 432.49, "r_y1": 406.9, "r_x2": 432.49, "r_y2": 399.79, "r_x3": 393.75, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 434.59, "t": 399.79, "r": 438.8, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.59, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.79, "r_x3": 434.59, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 440.91, "t": 399.79, "r": 463.22, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.91, "r_y0": 406.9, "r_x1": 463.22, "r_y1": 406.9, "r_x2": 463.22, "r_y2": 399.79, "r_x3": 440.91, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 384.12, "t": 258.55, "r": 413.99, "b": 265.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.12, "r_y0": 265.65, "r_x1": 413.99, "r_y1": 265.65, "r_x2": 413.99, "r_y2": 258.55, "r_x3": 384.12, "r_y3": 258.55, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 393.75, "t": 266.68, "r": 451.45, "b": 273.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 273.78, "r_x1": 451.45, "r_y1": 273.78, "r_x2": 451.45, "r_y2": 266.68, "r_x3": 393.75, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 453.55, "t": 266.68, "r": 461.97, "b": 273.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55, "r_y0": 273.78, "r_x1": 461.97, "r_y1": 273.78, "r_x2": 461.97, "r_y2": 266.68, "r_x3": 453.55, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 151.79, "t": 399.76, "r": 233.89, "b": 406.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79, "r_y0": 406.86, "r_x1": 233.89, "r_y1": 406.86, "r_x2": 233.89, "r_y2": 399.76, "r_x3": 151.79, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 235.99, "t": 399.76, "r": 244.42, "b": 406.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99, "r_y0": 406.86, "r_x1": 244.42, "r_y1": 406.86, "r_x2": 244.42, "r_y2": 399.76, "r_x3": 235.99, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 246.52, "t": 399.76, "r": 268.84, "b": 406.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52, "r_y0": 406.86, "r_x1": 268.84, "r_y1": 406.86, "r_x2": 268.84, "r_y2": 399.76, "r_x3": 246.52, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 154.33, "t": 213.57, "r": 159.8, "b": 220.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.33, "r_y0": 220.68, "r_x1": 159.8, "r_y1": 220.68, "r_x2": 159.8, "r_y2": 213.57, "r_x3": 154.33, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 321.07, "t": 213.57, "r": 326.54, "b": 220.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07, "r_y0": 220.68, "r_x1": 326.54, "r_y1": 220.68, "r_x2": 326.54, "r_y2": 213.57, "r_x3": 321.07, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 153.09, "t": 280.3, "r": 175.84, "b": 286.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 286.7, "r_x1": 175.84, "r_y1": 286.7, "r_x2": 175.84, "r_y2": 280.3, "r_x3": 153.09, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 160.67, "t": 287.12, "r": 172.8, "b": 293.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 293.52, "r_x1": 172.8, "r_y1": 293.52, "r_x2": 172.8, "r_y2": 287.12, "r_x3": 160.67, "r_y3": 287.12, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 168.25, "t": 293.94, "r": 177.91, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 300.33, "r_x1": 177.91, "r_y1": 300.33, "r_x2": 177.91, "r_y2": 293.94, "r_x3": 168.25, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 263.36, "t": 293.94, "r": 278.9, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.36, "r_y0": 300.33, "r_x1": 278.9, "r_y1": 300.33, "r_x2": 278.9, "r_y2": 293.94, "r_x3": 263.36, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 280.79, "t": 293.94, "r": 290.46, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79, "r_y0": 300.33, "r_x1": 290.46, "r_y1": 300.33, "r_x2": 290.46, "r_y2": 293.94, "r_x3": 280.79, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 335.93, "t": 293.94, "r": 351.47, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.93, "r_y0": 300.33, "r_x1": 351.47, "r_y1": 300.33, "r_x2": 351.47, "r_y2": 293.94, "r_x3": 335.93, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 160.67, "t": 300.75, "r": 174.69, "b": 307.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 307.15, "r_x1": 174.69, "r_y1": 307.15, "r_x2": 174.69, "r_y2": 300.75, "r_x3": 160.67, "r_y3": 300.75, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 160.67, "t": 307.57, "r": 172.8, "b": 313.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 313.97, "r_x1": 172.8, "r_y1": 313.97, "r_x2": 172.8, "r_y2": 307.57, "r_x3": 160.67, "r_y3": 307.57, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 168.25, "t": 314.39, "r": 181.89, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 320.78, "r_x1": 181.89, "r_y1": 320.78, "r_x2": 181.89, "r_y2": 314.39, "r_x3": 168.25, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 201.22, "t": 314.39, "r": 214.87, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 320.78, "r_x1": 214.87, "r_y1": 320.78, "r_x2": 214.87, "r_y2": 314.39, "r_x3": 201.22, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 234.19, "t": 314.39, "r": 247.84, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 320.78, "r_x1": 247.84, "r_y1": 320.78, "r_x2": 247.84, "r_y2": 314.39, "r_x3": 234.19, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 160.67, "t": 321.2, "r": 174.69, "b": 327.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 327.6, "r_x1": 174.69, "r_y1": 327.6, "r_x2": 174.69, "r_y2": 321.2, "r_x3": 160.67, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 160.67, "t": 328.02, "r": 172.8, "b": 334.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 334.42, "r_x1": 172.8, "r_y1": 334.42, "r_x2": 172.8, "r_y2": 328.02, "r_x3": 160.67, "r_y3": 328.02, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 168.25, "t": 334.84, "r": 373.09, "b": 341.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 341.23, "r_x1": 373.09, "r_y1": 341.23, "r_x2": 373.09, "r_y2": 334.84, "r_x3": 168.25, "r_y3": 334.84, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 160.67, "t": 341.66, "r": 174.69, "b": 348.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 348.05, "r_x1": 174.69, "r_y1": 348.05, "r_x2": 174.69, "r_y2": 341.66, "r_x3": 160.67, "r_y3": 341.66, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 160.67, "t": 348.47, "r": 172.8, "b": 354.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 354.87, "r_x1": 172.8, "r_y1": 354.87, "r_x2": 172.8, "r_y2": 348.47, "r_x3": 160.67, "r_y3": 348.47, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 168.25, "t": 355.29, "r": 181.89, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 361.68, "r_x1": 181.89, "r_y1": 361.68, "r_x2": 181.89, "r_y2": 355.29, "r_x3": 168.25, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 201.22, "t": 355.29, "r": 214.87, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 361.68, "r_x1": 214.87, "r_y1": 361.68, "r_x2": 214.87, "r_y2": 355.29, "r_x3": 201.22, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 234.19, "t": 355.29, "r": 247.84, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 361.68, "r_x1": 247.84, "r_y1": 361.68, "r_x2": 247.84, "r_y2": 355.29, "r_x3": 234.19, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 267.17, "t": 355.29, "r": 280.81, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 361.68, "r_x1": 280.81, "r_y1": 361.68, "r_x2": 280.81, "r_y2": 355.29, "r_x3": 267.17, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 160.67, "t": 362.11, "r": 174.69, "b": 368.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 368.5, "r_x1": 174.69, "r_y1": 368.5, "r_x2": 174.69, "r_y2": 362.11, "r_x3": 160.67, "r_y3": 362.11, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 160.67, "t": 368.92, "r": 172.8, "b": 375.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 375.32, "r_x1": 172.8, "r_y1": 375.32, "r_x2": 172.8, "r_y2": 368.92, "r_x3": 160.67, "r_y3": 368.92, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 168.25, "t": 375.74, "r": 181.89, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 382.13, "r_x1": 181.89, "r_y1": 382.13, "r_x2": 181.89, "r_y2": 375.74, "r_x3": 168.25, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 201.22, "t": 375.74, "r": 214.87, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 382.13, "r_x1": 214.87, "r_y1": 382.13, "r_x2": 214.87, "r_y2": 375.74, "r_x3": 201.22, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 234.19, "t": 375.74, "r": 247.84, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 382.13, "r_x1": 247.84, "r_y1": 382.13, "r_x2": 247.84, "r_y2": 375.74, "r_x3": 234.19, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 267.17, "t": 375.74, "r": 280.81, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 382.13, "r_x1": 280.81, "r_y1": 382.13, "r_x2": 280.81, "r_y2": 375.74, "r_x3": 267.17, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 160.67, "t": 382.56, "r": 174.69, "b": 388.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 388.95, "r_x1": 174.69, "r_y1": 388.95, "r_x2": 174.69, "r_y2": 382.56, "r_x3": 160.67, "r_y3": 382.56, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 153.09, "t": 389.37, "r": 177.73, "b": 395.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 395.77, "r_x1": 177.73, "r_y1": 395.77, "r_x2": 177.73, "r_y2": 389.37, "r_x3": 153.09, "r_y3": 389.37, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.79, "t": 314.39, "r": 199.33, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 320.78, "r_x1": 199.33, "r_y1": 320.78, "r_x2": 199.33, "r_y2": 314.39, "r_x3": 183.79, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 216.76, "t": 314.39, "r": 232.3, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 320.78, "r_x1": 232.3, "r_y1": 320.78, "r_x2": 232.3, "r_y2": 314.39, "r_x3": 216.76, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 249.73, "t": 314.39, "r": 265.27, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 320.78, "r_x1": 265.27, "r_y1": 320.78, "r_x2": 265.27, "r_y2": 314.39, "r_x3": 249.73, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 183.79, "t": 355.29, "r": 199.33, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 361.68, "r_x1": 199.33, "r_y1": 361.68, "r_x2": 199.33, "r_y2": 355.29, "r_x3": 183.79, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 216.76, "t": 355.29, "r": 232.3, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 361.68, "r_x1": 232.3, "r_y1": 361.68, "r_x2": 232.3, "r_y2": 355.29, "r_x3": 216.76, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 249.73, "t": 355.29, "r": 265.27, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 361.68, "r_x1": 265.27, "r_y1": 361.68, "r_x2": 265.27, "r_y2": 355.29, "r_x3": 249.73, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 282.71, "t": 355.29, "r": 298.25, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 361.68, "r_x1": 298.25, "r_y1": 361.68, "r_x2": 298.25, "r_y2": 355.29, "r_x3": 282.71, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.79, "t": 375.74, "r": 199.33, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 382.13, "r_x1": 199.33, "r_y1": 382.13, "r_x2": 199.33, "r_y2": 375.74, "r_x3": 183.79, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 216.76, "t": 375.74, "r": 232.3, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 382.13, "r_x1": 232.3, "r_y1": 382.13, "r_x2": 232.3, "r_y2": 375.74, "r_x3": 216.76, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 249.73, "t": 375.74, "r": 265.27, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 382.13, "r_x1": 265.27, "r_y1": 382.13, "r_x2": 265.27, "r_y2": 375.74, "r_x3": 249.73, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 282.71, "t": 375.74, "r": 298.25, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 382.13, "r_x1": 298.25, "r_y1": 382.13, "r_x2": 298.25, "r_y2": 375.74, "r_x3": 282.71, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 395.06, "t": 411.33, "r": 401.62, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06, "r_y0": 419.86, "r_x1": 401.62, "r_y1": 419.86, "r_x2": 401.62, "r_y2": 411.33, "r_x3": 395.06, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 407.42, "t": 411.33, "r": 412.48, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 419.86, "r_x1": 412.48, "r_y1": 419.86, "r_x2": 412.48, "r_y2": 411.33, "r_x3": 407.42, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 418.69, "t": 411.33, "r": 425.26, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69, "r_y0": 419.86, "r_x1": 425.26, "r_y1": 419.86, "r_x2": 425.26, "r_y2": 411.33, "r_x3": 418.69, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 430.51, "t": 411.33, "r": 436.57, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.51, "r_y0": 419.86, "r_x1": 436.57, "r_y1": 419.86, "r_x2": 436.57, "r_y2": 411.33, "r_x3": 430.51, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 152.36, "t": 409.77, "r": 175.11, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36, "r_y0": 416.17, "r_x1": 175.11, "r_y1": 416.17, "r_x2": 175.11, "r_y2": 409.77, "r_x3": 152.36, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 178.89, "t": 409.77, "r": 191.02, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89, "r_y0": 416.17, "r_x1": 191.02, "r_y1": 416.17, "r_x2": 191.02, "r_y2": 409.77, "r_x3": 178.89, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 194.81, "t": 409.77, "r": 208.83, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.81, "r_y0": 416.17, "r_x1": 208.83, "r_y1": 416.17, "r_x2": 208.83, "r_y2": 409.77, "r_x3": 194.81, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 212.61, "t": 409.77, "r": 226.26, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61, "r_y0": 416.17, "r_x1": 226.26, "r_y1": 416.17, "r_x2": 226.26, "r_y2": 409.77, "r_x3": 212.61, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 249.38, "t": 409.77, "r": 259.04, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.38, "r_y0": 416.17, "r_x1": 259.04, "r_y1": 416.17, "r_x2": 259.04, "r_y2": 409.77, "r_x3": 249.38, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 244.46, "t": 418.11, "r": 269.1, "b": 424.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.11, "r_x3": 244.46, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 230.05, "t": 409.77, "r": 245.59, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.05, "r_y0": 416.17, "r_x1": 245.59, "r_y1": 416.17, "r_x2": 245.59, "r_y2": 409.77, "r_x3": 230.05, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 154.51, "t": 258.6, "r": 159.62, "b": 265.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 265.71, "r_x1": 159.62, "r_y1": 265.71, "r_x2": 159.62, "r_y2": 258.6, "r_x3": 154.51, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 164.74, "t": 258.6, "r": 185.22, "b": 265.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74, "r_y0": 265.71, "r_x1": 185.22, "r_y1": 265.71, "r_x2": 185.22, "r_y2": 258.6, "r_x3": 164.74, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 164.35, "t": 266.5, "r": 222.05, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.35, "r_y0": 273.6, "r_x1": 222.05, "r_y1": 273.6, "r_x2": 222.05, "r_y2": 266.5, "r_x3": 164.35, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 224.15, "t": 266.5, "r": 232.58, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15, "r_y0": 273.6, "r_x1": 232.58, "r_y1": 273.6, "r_x2": 232.58, "r_y2": 266.5, "r_x3": 224.15, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 452.31, "r": 480.59, "b": 520.89, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 461.11, "r_x1": 161.33, "r_y1": 461.11, "r_x2": 161.33, "r_y2": 452.31, "r_x3": 134.76, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.27, "r_y0": 461.11, "r_x1": 226.29, "r_y1": 461.11, "r_x2": 226.29, "r_y2": 452.31, "r_x3": 164.27, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.99, "r_y0": 461.11, "r_x1": 480.59, "r_y1": 461.11, "r_x2": 480.59, "r_y2": 452.31, "r_x3": 229.99, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 473.07, "r_x1": 480.59, "r_y1": 473.07, "r_x2": 480.59, "r_y2": 464.27, "r_x3": 134.77, "r_y3": 464.27, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 485.02, "r_x1": 480.59, "r_y1": 485.02, "r_x2": 480.59, "r_y2": 476.22, "r_x3": 134.77, "r_y3": 476.22, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 496.98, "r_x1": 480.59, "r_y1": 496.98, "r_x2": 480.59, "r_y2": 488.18, "r_x3": 134.77, "r_y3": 488.18, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 508.93, "r_x1": 480.59, "r_y1": 508.93, "r_x2": 480.59, "r_y2": 500.13, "r_x3": 134.77, "r_y3": 500.13, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 520.89, "r_x1": 313.25, "r_y1": 520.89, "r_x2": 313.25, "r_y2": 512.09, "r_x3": 134.77, "r_y3": 512.09, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "today, table detection in documents is a well understood problem, and the latest state-of-the-art (SOTA) object detection methods provide an accuracy comparable to human observers [7,8,10,14,23]. On the other hand, the problem of table structure recognition (TSR) is a lot more challenging and remains a very active area of research, in which many novel machine learning algorithms are being explored [3,4,5,9,11,12,13,14,17,18,21,22]." }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.77, "t": 524.55, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 149.71, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.77, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.77, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.77, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.77, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.33, "r_x3": 134.77, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.77, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.77, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.77, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.77, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 421.45, "r_y1": 664.85, "r_x2": 421.45, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently emerging SOTA methods for table structure recognition employ transformer-based models, in which an image of the table is provided to the network in order to predict the structure of the table as a sequence of tokens. These image-to-sequence (Im2Seq) models are extremely powerful, since they allow for a purely data-driven solution. The tokens of the sequence typically belong to a markup language such as HTML, Latex or Markdown, which allow to describe table structure as rows, columns and spanning cells in various configurations. In Figure 1, we illustrate how HTML is used to represent the table-structure of a particular example table. Public table-structure data sets such as PubTabNet [22], and FinTabNet [21], which were created in a semi-automated way from paired PDF and HTML sources (e.g. PubMed Central), popularized primarily the use of HTML as ground-truth representation format for TSR." } ], "body": [ { "label": "caption", "id": 4, "page_no": 1, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.76, "t": 126.33, "r": 480.59, "b": 200.22, "coord_origin": "TOPLEFT" }, "confidence": 0.894, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 134.26, "r_x1": 162.64, "r_y1": 134.26, "r_x2": 162.64, "r_y2": 126.33, "r_x3": 134.76, "r_y3": 126.33, "coord_origin": "TOPLEFT" }, "text": "Fig. 1.", "orig": "Fig. 1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.06, "r_y0": 134.47, "r_x1": 480.59, "r_y1": 134.47, "r_x2": 480.59, "r_y2": 126.4, "r_x3": 167.06, "r_y3": 126.4, "coord_origin": "TOPLEFT" }, "text": "Comparison between HTML and OTSL table structure representation: (A)", "orig": "Comparison between HTML and OTSL table structure representation: (A)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 145.43, "r_x1": 480.59, "r_y1": 145.43, "r_x2": 480.59, "r_y2": 137.36, "r_x3": 134.76, "r_y3": 137.36, "coord_origin": "TOPLEFT" }, "text": "table-example with complex row and column headers, including a 2D empty span,", "orig": "table-example with complex row and column headers, including a 2D empty span,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 156.38, "r_x1": 147.95, "r_y1": 156.38, "r_x2": 147.95, "r_y2": 148.31, "r_x3": 134.76, "r_y3": 148.31, "coord_origin": "TOPLEFT" }, "text": "(B)", "orig": "(B)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.39, "r_y0": 156.38, "r_x1": 480.59, "r_y1": 156.38, "r_x2": 480.59, "r_y2": 148.31, "r_x3": 152.39, "r_y3": 148.31, "coord_origin": "TOPLEFT" }, "text": "minimal graphical representation of table structure using rectangular layout, (C)", "orig": "minimal graphical representation of table structure using rectangular layout, (C)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 167.34, "r_x1": 480.59, "r_y1": 167.34, "r_x2": 480.59, "r_y2": 159.27, "r_x3": 134.76, "r_y3": 159.27, "coord_origin": "TOPLEFT" }, "text": "HTML representation, (D) OTSL representation. This example demonstrates many of", "orig": "HTML representation, (D) OTSL representation. This example demonstrates many of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 178.3, "r_x1": 480.59, "r_y1": 178.3, "r_x2": 480.59, "r_y2": 170.23, "r_x3": 134.76, "r_y3": 170.23, "coord_origin": "TOPLEFT" }, "text": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "orig": "the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 189.26, "r_x1": 480.59, "r_y1": 189.26, "r_x2": 480.59, "r_y2": 181.19, "r_x3": 134.76, "r_y3": 181.19, "coord_origin": "TOPLEFT" }, "text": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "orig": "its reduced sequence length (55 versus 30) and a enhanced internal structure (variable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 200.22, "r_x1": 460.87, "r_y1": 200.22, "r_x2": 460.87, "r_y2": 192.15, "r_x3": 134.76, "r_y3": 192.15, "coord_origin": "TOPLEFT" }, "text": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "orig": "token sequence length per row in HTML versus a fixed length of rows in OTSL).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 1. Comparison between HTML and OTSL table structure representation: (A) table-example with complex row and column headers, including a 2D empty span, (B) minimal graphical representation of table structure using rectangular layout, (C) HTML representation, (D) OTSL representation. This example demonstrates many of the key-features of OTSL, namely its reduced vocabulary size (12 versus 5 in this case), its reduced sequence length (55 versus 30) and a enhanced internal structure (variable token sequence length per row in HTML versus a fixed length of rows in OTSL)." }, { "label": "picture", "id": 1, "page_no": 1, "cluster": { "id": 1, "label": "picture", "bbox": { "l": 148.45, "t": 208.37, "r": 464.36, "b": 425.85, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41, "r_y0": 289.51, "r_x1": 402.97, "r_y1": 289.51, "r_x2": 402.97, "r_y2": 280.98, "r_x3": 396.41, "r_y3": 280.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.59, "r_y0": 289.42, "r_x1": 425.15, "r_y1": 289.42, "r_x2": 425.15, "r_y2": 280.9, "r_x3": 418.59, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.75, "r_y0": 311.76, "r_x1": 402.31, "r_y1": 311.76, "r_x2": 402.31, "r_y2": 303.24, "r_x3": 395.75, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.37, "r_x3": 407.54, "r_y3": 303.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56, "r_y0": 322.93, "r_x1": 414.13, "r_y1": 322.93, "r_x2": 414.13, "r_y2": 314.41, "r_x3": 407.56, "r_y3": 314.41, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51, "r_y0": 300.61, "r_x1": 425.07, "r_y1": 300.61, "r_x2": 425.07, "r_y2": 292.09, "r_x3": 418.51, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.62, "r_x1": 436.16, "r_y1": 300.62, "r_x2": 436.16, "r_y2": 292.09, "r_x3": 429.6, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.69, "r_y0": 300.54, "r_x1": 447.25, "r_y1": 300.54, "r_x2": 447.25, "r_y2": 292.01, "r_x3": 440.69, "r_y3": 292.01, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62, "r_y0": 311.82, "r_x1": 425.19, "r_y1": 311.82, "r_x2": 425.19, "r_y2": 303.29, "r_x3": 418.62, "r_y3": 303.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 311.83, "r_x1": 436.27, "r_y1": 311.83, "r_x2": 436.27, "r_y2": 303.3, "r_x3": 429.71, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.75, "r_x1": 447.36, "r_y1": 311.75, "r_x2": 447.36, "r_y2": 303.22, "r_x3": 440.8, "r_y3": 303.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.63, "r_y0": 323.09, "r_x1": 425.19, "r_y1": 323.09, "r_x2": 425.19, "r_y2": 314.57, "r_x3": 418.63, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 323.1, "r_x1": 436.27, "r_y1": 323.1, "r_x2": 436.27, "r_y2": 314.57, "r_x3": 429.71, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.02, "r_x1": 447.36, "r_y1": 323.02, "r_x2": 447.36, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.82, "r_x1": 413.96, "r_y1": 333.82, "r_x2": 413.96, "r_y2": 325.29, "r_x3": 407.4, "r_y3": 325.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.46, "r_y0": 333.98, "r_x1": 425.02, "r_y1": 333.98, "r_x2": 425.02, "r_y2": 325.45, "r_x3": 418.46, "r_y3": 325.45, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.55, "r_y0": 333.98, "r_x1": 436.11, "r_y1": 333.98, "r_x2": 436.11, "r_y2": 325.46, "r_x3": 429.55, "r_y3": 325.46, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.64, "r_y0": 333.91, "r_x1": 447.2, "r_y1": 333.91, "r_x2": 447.2, "r_y2": 325.38, "r_x3": 440.64, "r_y3": 325.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.68, "r_x1": 463.51, "r_y1": 288.68, "r_x2": 463.51, "r_y2": 280.16, "r_x3": 451.9, "r_y3": 280.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.16, "r_y0": 300.12, "r_x1": 463.77, "r_y1": 300.12, "r_x2": 463.77, "r_y2": 291.6, "r_x3": 452.16, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.18, "r_y0": 311.37, "r_x1": 463.79, "r_y1": 311.37, "r_x2": 463.79, "r_y2": 302.84, "r_x3": 452.18, "r_y3": 302.84, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.65, "r_x1": 463.72, "r_y1": 322.65, "r_x2": 463.72, "r_y2": 314.12, "r_x3": 452.1, "r_y3": 314.12, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 333.99, "r_x1": 463.91, "r_y1": 333.99, "r_x2": 463.91, "r_y2": 325.47, "r_x3": 452.3, "r_y3": 325.47, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.02, "r_x1": 402.66, "r_y1": 323.02, "r_x2": 402.66, "r_y2": 314.49, "r_x3": 396.1, "r_y3": 314.49, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.91, "r_x1": 402.56, "r_y1": 333.91, "r_x2": 402.56, "r_y2": 325.39, "r_x3": 396.0, "r_y3": 325.39, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 300.8, "r_x1": 402.84, "r_y1": 300.8, "r_x2": 402.84, "r_y2": 292.27, "r_x3": 396.27, "r_y3": 292.27, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.55, "r_y0": 289.49, "r_x1": 413.6, "r_y1": 289.49, "r_x2": 413.6, "r_y2": 280.97, "r_x3": 408.55, "r_y3": 280.97, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.59, "r_y0": 289.02, "r_x1": 435.64, "r_y1": 289.02, "r_x2": 435.64, "r_y2": 280.5, "r_x3": 430.59, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08, "r_y0": 288.91, "r_x1": 446.13, "r_y1": 288.91, "r_x2": 446.13, "r_y2": 280.38, "r_x3": 441.08, "r_y3": 280.38, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97, "r_y0": 300.66, "r_x1": 414.04, "r_y1": 300.66, "r_x2": 414.04, "r_y2": 292.13, "r_x3": 407.97, "r_y3": 292.13, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.26, "r_y0": 419.71, "r_x1": 452.87, "r_y1": 419.71, "r_x2": 452.87, "r_y2": 411.18, "r_x3": 441.26, "r_y3": 411.18, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 406.9, "r_x1": 432.49, "r_y1": 406.9, "r_x2": 432.49, "r_y2": 399.79, "r_x3": 393.75, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.59, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.79, "r_x3": 434.59, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.91, "r_y0": 406.9, "r_x1": 463.22, "r_y1": 406.9, "r_x2": 463.22, "r_y2": 399.79, "r_x3": 440.91, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.12, "r_y0": 265.65, "r_x1": 413.99, "r_y1": 265.65, "r_x2": 413.99, "r_y2": 258.55, "r_x3": 384.12, "r_y3": 258.55, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 273.78, "r_x1": 451.45, "r_y1": 273.78, "r_x2": 451.45, "r_y2": 266.68, "r_x3": 393.75, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55, "r_y0": 273.78, "r_x1": 461.97, "r_y1": 273.78, "r_x2": 461.97, "r_y2": 266.68, "r_x3": 453.55, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79, "r_y0": 406.86, "r_x1": 233.89, "r_y1": 406.86, "r_x2": 233.89, "r_y2": 399.76, "r_x3": 151.79, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99, "r_y0": 406.86, "r_x1": 244.42, "r_y1": 406.86, "r_x2": 244.42, "r_y2": 399.76, "r_x3": 235.99, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52, "r_y0": 406.86, "r_x1": 268.84, "r_y1": 406.86, "r_x2": 268.84, "r_y2": 399.76, "r_x3": 246.52, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.33, "r_y0": 220.68, "r_x1": 159.8, "r_y1": 220.68, "r_x2": 159.8, "r_y2": 213.57, "r_x3": 154.33, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07, "r_y0": 220.68, "r_x1": 326.54, "r_y1": 220.68, "r_x2": 326.54, "r_y2": 213.57, "r_x3": 321.07, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 286.7, "r_x1": 175.84, "r_y1": 286.7, "r_x2": 175.84, "r_y2": 280.3, "r_x3": 153.09, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 293.52, "r_x1": 172.8, "r_y1": 293.52, "r_x2": 172.8, "r_y2": 287.12, "r_x3": 160.67, "r_y3": 287.12, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 300.33, "r_x1": 177.91, "r_y1": 300.33, "r_x2": 177.91, "r_y2": 293.94, "r_x3": 168.25, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.36, "r_y0": 300.33, "r_x1": 278.9, "r_y1": 300.33, "r_x2": 278.9, "r_y2": 293.94, "r_x3": 263.36, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79, "r_y0": 300.33, "r_x1": 290.46, "r_y1": 300.33, "r_x2": 290.46, "r_y2": 293.94, "r_x3": 280.79, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.93, "r_y0": 300.33, "r_x1": 351.47, "r_y1": 300.33, "r_x2": 351.47, "r_y2": 293.94, "r_x3": 335.93, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 307.15, "r_x1": 174.69, "r_y1": 307.15, "r_x2": 174.69, "r_y2": 300.75, "r_x3": 160.67, "r_y3": 300.75, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 313.97, "r_x1": 172.8, "r_y1": 313.97, "r_x2": 172.8, "r_y2": 307.57, "r_x3": 160.67, "r_y3": 307.57, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 320.78, "r_x1": 181.89, "r_y1": 320.78, "r_x2": 181.89, "r_y2": 314.39, "r_x3": 168.25, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 320.78, "r_x1": 214.87, "r_y1": 320.78, "r_x2": 214.87, "r_y2": 314.39, "r_x3": 201.22, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 320.78, "r_x1": 247.84, "r_y1": 320.78, "r_x2": 247.84, "r_y2": 314.39, "r_x3": 234.19, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 327.6, "r_x1": 174.69, "r_y1": 327.6, "r_x2": 174.69, "r_y2": 321.2, "r_x3": 160.67, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 334.42, "r_x1": 172.8, "r_y1": 334.42, "r_x2": 172.8, "r_y2": 328.02, "r_x3": 160.67, "r_y3": 328.02, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 341.23, "r_x1": 373.09, "r_y1": 341.23, "r_x2": 373.09, "r_y2": 334.84, "r_x3": 168.25, "r_y3": 334.84, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 348.05, "r_x1": 174.69, "r_y1": 348.05, "r_x2": 174.69, "r_y2": 341.66, "r_x3": 160.67, "r_y3": 341.66, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 354.87, "r_x1": 172.8, "r_y1": 354.87, "r_x2": 172.8, "r_y2": 348.47, "r_x3": 160.67, "r_y3": 348.47, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 361.68, "r_x1": 181.89, "r_y1": 361.68, "r_x2": 181.89, "r_y2": 355.29, "r_x3": 168.25, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 361.68, "r_x1": 214.87, "r_y1": 361.68, "r_x2": 214.87, "r_y2": 355.29, "r_x3": 201.22, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 361.68, "r_x1": 247.84, "r_y1": 361.68, "r_x2": 247.84, "r_y2": 355.29, "r_x3": 234.19, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 361.68, "r_x1": 280.81, "r_y1": 361.68, "r_x2": 280.81, "r_y2": 355.29, "r_x3": 267.17, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 368.5, "r_x1": 174.69, "r_y1": 368.5, "r_x2": 174.69, "r_y2": 362.11, "r_x3": 160.67, "r_y3": 362.11, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 375.32, "r_x1": 172.8, "r_y1": 375.32, "r_x2": 172.8, "r_y2": 368.92, "r_x3": 160.67, "r_y3": 368.92, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 382.13, "r_x1": 181.89, "r_y1": 382.13, "r_x2": 181.89, "r_y2": 375.74, "r_x3": 168.25, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 382.13, "r_x1": 214.87, "r_y1": 382.13, "r_x2": 214.87, "r_y2": 375.74, "r_x3": 201.22, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 382.13, "r_x1": 247.84, "r_y1": 382.13, "r_x2": 247.84, "r_y2": 375.74, "r_x3": 234.19, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 382.13, "r_x1": 280.81, "r_y1": 382.13, "r_x2": 280.81, "r_y2": 375.74, "r_x3": 267.17, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 388.95, "r_x1": 174.69, "r_y1": 388.95, "r_x2": 174.69, "r_y2": 382.56, "r_x3": 160.67, "r_y3": 382.56, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 395.77, "r_x1": 177.73, "r_y1": 395.77, "r_x2": 177.73, "r_y2": 389.37, "r_x3": 153.09, "r_y3": 389.37, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 320.78, "r_x1": 199.33, "r_y1": 320.78, "r_x2": 199.33, "r_y2": 314.39, "r_x3": 183.79, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 320.78, "r_x1": 232.3, "r_y1": 320.78, "r_x2": 232.3, "r_y2": 314.39, "r_x3": 216.76, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 320.78, "r_x1": 265.27, "r_y1": 320.78, "r_x2": 265.27, "r_y2": 314.39, "r_x3": 249.73, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 361.68, "r_x1": 199.33, "r_y1": 361.68, "r_x2": 199.33, "r_y2": 355.29, "r_x3": 183.79, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 361.68, "r_x1": 232.3, "r_y1": 361.68, "r_x2": 232.3, "r_y2": 355.29, "r_x3": 216.76, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 361.68, "r_x1": 265.27, "r_y1": 361.68, "r_x2": 265.27, "r_y2": 355.29, "r_x3": 249.73, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 361.68, "r_x1": 298.25, "r_y1": 361.68, "r_x2": 298.25, "r_y2": 355.29, "r_x3": 282.71, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 382.13, "r_x1": 199.33, "r_y1": 382.13, "r_x2": 199.33, "r_y2": 375.74, "r_x3": 183.79, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 382.13, "r_x1": 232.3, "r_y1": 382.13, "r_x2": 232.3, "r_y2": 375.74, "r_x3": 216.76, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 382.13, "r_x1": 265.27, "r_y1": 382.13, "r_x2": 265.27, "r_y2": 375.74, "r_x3": 249.73, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 382.13, "r_x1": 298.25, "r_y1": 382.13, "r_x2": 298.25, "r_y2": 375.74, "r_x3": 282.71, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06, "r_y0": 419.86, "r_x1": 401.62, "r_y1": 419.86, "r_x2": 401.62, "r_y2": 411.33, "r_x3": 395.06, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 419.86, "r_x1": 412.48, "r_y1": 419.86, "r_x2": 412.48, "r_y2": 411.33, "r_x3": 407.42, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69, "r_y0": 419.86, "r_x1": 425.26, "r_y1": 419.86, "r_x2": 425.26, "r_y2": 411.33, "r_x3": 418.69, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.51, "r_y0": 419.86, "r_x1": 436.57, "r_y1": 419.86, "r_x2": 436.57, "r_y2": 411.33, "r_x3": 430.51, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36, "r_y0": 416.17, "r_x1": 175.11, "r_y1": 416.17, "r_x2": 175.11, "r_y2": 409.77, "r_x3": 152.36, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89, "r_y0": 416.17, "r_x1": 191.02, "r_y1": 416.17, "r_x2": 191.02, "r_y2": 409.77, "r_x3": 178.89, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.81, "r_y0": 416.17, "r_x1": 208.83, "r_y1": 416.17, "r_x2": 208.83, "r_y2": 409.77, "r_x3": 194.81, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61, "r_y0": 416.17, "r_x1": 226.26, "r_y1": 416.17, "r_x2": 226.26, "r_y2": 409.77, "r_x3": 212.61, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.38, "r_y0": 416.17, "r_x1": 259.04, "r_y1": 416.17, "r_x2": 259.04, "r_y2": 409.77, "r_x3": 249.38, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.11, "r_x3": 244.46, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.05, "r_y0": 416.17, "r_x1": 245.59, "r_y1": 416.17, "r_x2": 245.59, "r_y2": 409.77, "r_x3": 230.05, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 265.71, "r_x1": 159.62, "r_y1": 265.71, "r_x2": 159.62, "r_y2": 258.6, "r_x3": 154.51, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74, "r_y0": 265.71, "r_x1": 185.22, "r_y1": 265.71, "r_x2": 185.22, "r_y2": 258.6, "r_x3": 164.74, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.35, "r_y0": 273.6, "r_x1": 222.05, "r_y1": 273.6, "r_x2": 222.05, "r_y2": 266.5, "r_x3": 164.35, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15, "r_y0": 273.6, "r_x1": 232.58, "r_y1": 273.6, "r_x2": 232.58, "r_y2": 266.5, "r_x3": 224.15, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 396.41, "t": 280.98, "r": 402.97, "b": 289.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.41, "r_y0": 289.51, "r_x1": 402.97, "r_y1": 289.51, "r_x2": 402.97, "r_y2": 280.98, "r_x3": 396.41, "r_y3": 280.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 418.59, "t": 280.9, "r": 425.15, "b": 289.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.59, "r_y0": 289.42, "r_x1": 425.15, "r_y1": 289.42, "r_x2": 425.15, "r_y2": 280.9, "r_x3": 418.59, "r_y3": 280.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 395.75, "t": 303.24, "r": 402.31, "b": 311.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.75, "r_y0": 311.76, "r_x1": 402.31, "r_y1": 311.76, "r_x2": 402.31, "r_y2": 303.24, "r_x3": 395.75, "r_y3": 303.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 407.54, "t": 303.37, "r": 414.1, "b": 311.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.54, "r_y0": 311.9, "r_x1": 414.1, "r_y1": 311.9, "r_x2": 414.1, "r_y2": 303.37, "r_x3": 407.54, "r_y3": 303.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 407.56, "t": 314.41, "r": 414.13, "b": 322.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.56, "r_y0": 322.93, "r_x1": 414.13, "r_y1": 322.93, "r_x2": 414.13, "r_y2": 314.41, "r_x3": 407.56, "r_y3": 314.41, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 418.51, "t": 292.09, "r": 425.07, "b": 300.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.51, "r_y0": 300.61, "r_x1": 425.07, "r_y1": 300.61, "r_x2": 425.07, "r_y2": 292.09, "r_x3": 418.51, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 429.6, "t": 292.09, "r": 436.16, "b": 300.62, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.6, "r_y0": 300.62, "r_x1": 436.16, "r_y1": 300.62, "r_x2": 436.16, "r_y2": 292.09, "r_x3": 429.6, "r_y3": 292.09, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 440.69, "t": 292.01, "r": 447.25, "b": 300.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.69, "r_y0": 300.54, "r_x1": 447.25, "r_y1": 300.54, "r_x2": 447.25, "r_y2": 292.01, "r_x3": 440.69, "r_y3": 292.01, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 418.62, "t": 303.29, "r": 425.19, "b": 311.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.62, "r_y0": 311.82, "r_x1": 425.19, "r_y1": 311.82, "r_x2": 425.19, "r_y2": 303.29, "r_x3": 418.62, "r_y3": 303.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 429.71, "t": 303.3, "r": 436.27, "b": 311.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 311.83, "r_x1": 436.27, "r_y1": 311.83, "r_x2": 436.27, "r_y2": 303.3, "r_x3": 429.71, "r_y3": 303.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 440.8, "t": 303.22, "r": 447.36, "b": 311.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 311.75, "r_x1": 447.36, "r_y1": 311.75, "r_x2": 447.36, "r_y2": 303.22, "r_x3": 440.8, "r_y3": 303.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 418.63, "t": 314.57, "r": 425.19, "b": 323.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.63, "r_y0": 323.09, "r_x1": 425.19, "r_y1": 323.09, "r_x2": 425.19, "r_y2": 314.57, "r_x3": 418.63, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 429.71, "t": 314.57, "r": 436.27, "b": 323.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.71, "r_y0": 323.1, "r_x1": 436.27, "r_y1": 323.1, "r_x2": 436.27, "r_y2": 314.57, "r_x3": 429.71, "r_y3": 314.57, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 440.8, "t": 314.5, "r": 447.36, "b": 323.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.8, "r_y0": 323.02, "r_x1": 447.36, "r_y1": 323.02, "r_x2": 447.36, "r_y2": 314.5, "r_x3": 440.8, "r_y3": 314.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 407.4, "t": 325.29, "r": 413.96, "b": 333.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.4, "r_y0": 333.82, "r_x1": 413.96, "r_y1": 333.82, "r_x2": 413.96, "r_y2": 325.29, "r_x3": 407.4, "r_y3": 325.29, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 418.46, "t": 325.45, "r": 425.02, "b": 333.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.46, "r_y0": 333.98, "r_x1": 425.02, "r_y1": 333.98, "r_x2": 425.02, "r_y2": 325.45, "r_x3": 418.46, "r_y3": 325.45, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 429.55, "t": 325.46, "r": 436.11, "b": 333.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 429.55, "r_y0": 333.98, "r_x1": 436.11, "r_y1": 333.98, "r_x2": 436.11, "r_y2": 325.46, "r_x3": 429.55, "r_y3": 325.46, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 440.64, "t": 325.38, "r": 447.2, "b": 333.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.64, "r_y0": 333.91, "r_x1": 447.2, "r_y1": 333.91, "r_x2": 447.2, "r_y2": 325.38, "r_x3": 440.64, "r_y3": 325.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 451.9, "t": 280.16, "r": 463.51, "b": 288.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 451.9, "r_y0": 288.68, "r_x1": 463.51, "r_y1": 288.68, "r_x2": 463.51, "r_y2": 280.16, "r_x3": 451.9, "r_y3": 280.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 452.16, "t": 291.6, "r": 463.77, "b": 300.12, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.16, "r_y0": 300.12, "r_x1": 463.77, "r_y1": 300.12, "r_x2": 463.77, "r_y2": 291.6, "r_x3": 452.16, "r_y3": 291.6, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 452.18, "t": 302.84, "r": 463.79, "b": 311.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.18, "r_y0": 311.37, "r_x1": 463.79, "r_y1": 311.37, "r_x2": 463.79, "r_y2": 302.84, "r_x3": 452.18, "r_y3": 302.84, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 452.1, "t": 314.12, "r": 463.72, "b": 322.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.1, "r_y0": 322.65, "r_x1": 463.72, "r_y1": 322.65, "r_x2": 463.72, "r_y2": 314.12, "r_x3": 452.1, "r_y3": 314.12, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 452.3, "t": 325.47, "r": 463.91, "b": 333.99, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 452.3, "r_y0": 333.99, "r_x1": 463.91, "r_y1": 333.99, "r_x2": 463.91, "r_y2": 325.47, "r_x3": 452.3, "r_y3": 325.47, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 396.1, "t": 314.49, "r": 402.66, "b": 323.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.1, "r_y0": 323.02, "r_x1": 402.66, "r_y1": 323.02, "r_x2": 402.66, "r_y2": 314.49, "r_x3": 396.1, "r_y3": 314.49, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 396.0, "t": 325.39, "r": 402.56, "b": 333.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.0, "r_y0": 333.91, "r_x1": 402.56, "r_y1": 333.91, "r_x2": 402.56, "r_y2": 325.39, "r_x3": 396.0, "r_y3": 325.39, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.27, "t": 292.27, "r": 402.84, "b": 300.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 300.8, "r_x1": 402.84, "r_y1": 300.8, "r_x2": 402.84, "r_y2": 292.27, "r_x3": 396.27, "r_y3": 292.27, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 408.55, "t": 280.97, "r": 413.6, "b": 289.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.55, "r_y0": 289.49, "r_x1": 413.6, "r_y1": 289.49, "r_x2": 413.6, "r_y2": 280.97, "r_x3": 408.55, "r_y3": 280.97, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 430.59, "t": 280.5, "r": 435.64, "b": 289.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.59, "r_y0": 289.02, "r_x1": 435.64, "r_y1": 289.02, "r_x2": 435.64, "r_y2": 280.5, "r_x3": 430.59, "r_y3": 280.5, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 441.08, "t": 280.38, "r": 446.13, "b": 288.91, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.08, "r_y0": 288.91, "r_x1": 446.13, "r_y1": 288.91, "r_x2": 446.13, "r_y2": 280.38, "r_x3": 441.08, "r_y3": 280.38, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 407.97, "t": 292.13, "r": 414.04, "b": 300.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.97, "r_y0": 300.66, "r_x1": 414.04, "r_y1": 300.66, "r_x2": 414.04, "r_y2": 292.13, "r_x3": 407.97, "r_y3": 292.13, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 441.26, "t": 411.18, "r": 452.87, "b": 419.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 441.26, "r_y0": 419.71, "r_x1": 452.87, "r_y1": 419.71, "r_x2": 452.87, "r_y2": 411.18, "r_x3": 441.26, "r_y3": 411.18, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 393.75, "t": 399.79, "r": 432.49, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 406.9, "r_x1": 432.49, "r_y1": 406.9, "r_x2": 432.49, "r_y2": 399.79, "r_x3": 393.75, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "vocabulary:", "orig": "vocabulary:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 434.59, "t": 399.79, "r": 438.8, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 434.59, "r_y0": 406.9, "r_x1": 438.8, "r_y1": 406.9, "r_x2": 438.8, "r_y2": 399.79, "r_x3": 434.59, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 440.91, "t": 399.79, "r": 463.22, "b": 406.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.91, "r_y0": 406.9, "r_x1": 463.22, "r_y1": 406.9, "r_x2": 463.22, "r_y2": 399.79, "r_x3": 440.91, "r_y3": 399.79, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 384.12, "t": 258.55, "r": 413.99, "b": 265.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 384.12, "r_y0": 265.65, "r_x1": 413.99, "r_y1": 265.65, "r_x2": 413.99, "r_y2": 258.55, "r_x3": 384.12, "r_y3": 258.55, "coord_origin": "TOPLEFT" }, "text": "D OTSL", "orig": "D OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 393.75, "t": 266.68, "r": 451.45, "b": 273.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 393.75, "r_y0": 273.78, "r_x1": 451.45, "r_y1": 273.78, "r_x2": 451.45, "r_y2": 266.68, "r_x3": 393.75, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 453.55, "t": 266.68, "r": 461.97, "b": 273.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.55, "r_y0": 273.78, "r_x1": 461.97, "r_y1": 273.78, "r_x2": 461.97, "r_y2": 266.68, "r_x3": 453.55, "r_y3": 266.68, "coord_origin": "TOPLEFT" }, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 151.79, "t": 399.76, "r": 233.89, "b": 406.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.79, "r_y0": 406.86, "r_x1": 233.89, "r_y1": 406.86, "r_x2": 233.89, "r_y2": 399.76, "r_x3": 151.79, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "vocabulary for this table:", "orig": "vocabulary for this table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 235.99, "t": 399.76, "r": 244.42, "b": 406.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.99, "r_y0": 406.86, "r_x1": 244.42, "r_y1": 406.86, "r_x2": 244.42, "r_y2": 399.76, "r_x3": 235.99, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 246.52, "t": 399.76, "r": 268.84, "b": 406.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.52, "r_y0": 406.86, "r_x1": 268.84, "r_y1": 406.86, "r_x2": 268.84, "r_y2": 399.76, "r_x3": 246.52, "r_y3": 399.76, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 154.33, "t": 213.57, "r": 159.8, "b": 220.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.33, "r_y0": 220.68, "r_x1": 159.8, "r_y1": 220.68, "r_x2": 159.8, "r_y2": 213.57, "r_x3": 154.33, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 321.07, "t": 213.57, "r": 326.54, "b": 220.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.07, "r_y0": 220.68, "r_x1": 326.54, "r_y1": 220.68, "r_x2": 326.54, "r_y2": 213.57, "r_x3": 321.07, "r_y3": 213.57, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 153.09, "t": 280.3, "r": 175.84, "b": 286.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 286.7, "r_x1": 175.84, "r_y1": 286.7, "r_x2": 175.84, "r_y2": 280.3, "r_x3": 153.09, "r_y3": 280.3, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 160.67, "t": 287.12, "r": 172.8, "b": 293.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 293.52, "r_x1": 172.8, "r_y1": 293.52, "r_x2": 172.8, "r_y2": 287.12, "r_x3": 160.67, "r_y3": 287.12, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 168.25, "t": 293.94, "r": 177.91, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 300.33, "r_x1": 177.91, "r_y1": 300.33, "r_x2": 177.91, "r_y2": 293.94, "r_x3": 168.25, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 263.36, "t": 293.94, "r": 278.9, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 263.36, "r_y0": 300.33, "r_x1": 278.9, "r_y1": 300.33, "r_x2": 278.9, "r_y2": 293.94, "r_x3": 263.36, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 280.79, "t": 293.94, "r": 290.46, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 280.79, "r_y0": 300.33, "r_x1": 290.46, "r_y1": 300.33, "r_x2": 290.46, "r_y2": 293.94, "r_x3": 280.79, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 335.93, "t": 293.94, "r": 351.47, "b": 300.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 335.93, "r_y0": 300.33, "r_x1": 351.47, "r_y1": 300.33, "r_x2": 351.47, "r_y2": 293.94, "r_x3": 335.93, "r_y3": 293.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 160.67, "t": 300.75, "r": 174.69, "b": 307.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 307.15, "r_x1": 174.69, "r_y1": 307.15, "r_x2": 174.69, "r_y2": 300.75, "r_x3": 160.67, "r_y3": 300.75, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 160.67, "t": 307.57, "r": 172.8, "b": 313.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 313.97, "r_x1": 172.8, "r_y1": 313.97, "r_x2": 172.8, "r_y2": 307.57, "r_x3": 160.67, "r_y3": 307.57, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 168.25, "t": 314.39, "r": 181.89, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 320.78, "r_x1": 181.89, "r_y1": 320.78, "r_x2": 181.89, "r_y2": 314.39, "r_x3": 168.25, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 201.22, "t": 314.39, "r": 214.87, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 320.78, "r_x1": 214.87, "r_y1": 320.78, "r_x2": 214.87, "r_y2": 314.39, "r_x3": 201.22, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 234.19, "t": 314.39, "r": 247.84, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 320.78, "r_x1": 247.84, "r_y1": 320.78, "r_x2": 247.84, "r_y2": 314.39, "r_x3": 234.19, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 160.67, "t": 321.2, "r": 174.69, "b": 327.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 327.6, "r_x1": 174.69, "r_y1": 327.6, "r_x2": 174.69, "r_y2": 321.2, "r_x3": 160.67, "r_y3": 321.2, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 160.67, "t": 328.02, "r": 172.8, "b": 334.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 334.42, "r_x1": 172.8, "r_y1": 334.42, "r_x2": 172.8, "r_y2": 328.02, "r_x3": 160.67, "r_y3": 328.02, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 168.25, "t": 334.84, "r": 373.09, "b": 341.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 341.23, "r_x1": 373.09, "r_y1": 341.23, "r_x2": 373.09, "r_y2": 334.84, "r_x3": 168.25, "r_y3": 334.84, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 160.67, "t": 341.66, "r": 174.69, "b": 348.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 348.05, "r_x1": 174.69, "r_y1": 348.05, "r_x2": 174.69, "r_y2": 341.66, "r_x3": 160.67, "r_y3": 341.66, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 160.67, "t": 348.47, "r": 172.8, "b": 354.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 354.87, "r_x1": 172.8, "r_y1": 354.87, "r_x2": 172.8, "r_y2": 348.47, "r_x3": 160.67, "r_y3": 348.47, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 168.25, "t": 355.29, "r": 181.89, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 361.68, "r_x1": 181.89, "r_y1": 361.68, "r_x2": 181.89, "r_y2": 355.29, "r_x3": 168.25, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 201.22, "t": 355.29, "r": 214.87, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 361.68, "r_x1": 214.87, "r_y1": 361.68, "r_x2": 214.87, "r_y2": 355.29, "r_x3": 201.22, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 234.19, "t": 355.29, "r": 247.84, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 361.68, "r_x1": 247.84, "r_y1": 361.68, "r_x2": 247.84, "r_y2": 355.29, "r_x3": 234.19, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 267.17, "t": 355.29, "r": 280.81, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 361.68, "r_x1": 280.81, "r_y1": 361.68, "r_x2": 280.81, "r_y2": 355.29, "r_x3": 267.17, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 160.67, "t": 362.11, "r": 174.69, "b": 368.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 368.5, "r_x1": 174.69, "r_y1": 368.5, "r_x2": 174.69, "r_y2": 362.11, "r_x3": 160.67, "r_y3": 362.11, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 160.67, "t": 368.92, "r": 172.8, "b": 375.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 375.32, "r_x1": 172.8, "r_y1": 375.32, "r_x2": 172.8, "r_y2": 368.92, "r_x3": 160.67, "r_y3": 368.92, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 168.25, "t": 375.74, "r": 181.89, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.25, "r_y0": 382.13, "r_x1": 181.89, "r_y1": 382.13, "r_x2": 181.89, "r_y2": 375.74, "r_x3": 168.25, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 201.22, "t": 375.74, "r": 214.87, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.22, "r_y0": 382.13, "r_x1": 214.87, "r_y1": 382.13, "r_x2": 214.87, "r_y2": 375.74, "r_x3": 201.22, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 234.19, "t": 375.74, "r": 247.84, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 234.19, "r_y0": 382.13, "r_x1": 247.84, "r_y1": 382.13, "r_x2": 247.84, "r_y2": 375.74, "r_x3": 234.19, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 267.17, "t": 375.74, "r": 280.81, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.17, "r_y0": 382.13, "r_x1": 280.81, "r_y1": 382.13, "r_x2": 280.81, "r_y2": 375.74, "r_x3": 267.17, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 160.67, "t": 382.56, "r": 174.69, "b": 388.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.67, "r_y0": 388.95, "r_x1": 174.69, "r_y1": 388.95, "r_x2": 174.69, "r_y2": 382.56, "r_x3": 160.67, "r_y3": 382.56, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 153.09, "t": 389.37, "r": 177.73, "b": 395.77, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 153.09, "r_y0": 395.77, "r_x1": 177.73, "r_y1": 395.77, "r_x2": 177.73, "r_y2": 389.37, "r_x3": 153.09, "r_y3": 389.37, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.79, "t": 314.39, "r": 199.33, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 320.78, "r_x1": 199.33, "r_y1": 320.78, "r_x2": 199.33, "r_y2": 314.39, "r_x3": 183.79, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 216.76, "t": 314.39, "r": 232.3, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 320.78, "r_x1": 232.3, "r_y1": 320.78, "r_x2": 232.3, "r_y2": 314.39, "r_x3": 216.76, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 249.73, "t": 314.39, "r": 265.27, "b": 320.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 320.78, "r_x1": 265.27, "r_y1": 320.78, "r_x2": 265.27, "r_y2": 314.39, "r_x3": 249.73, "r_y3": 314.39, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 183.79, "t": 355.29, "r": 199.33, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 361.68, "r_x1": 199.33, "r_y1": 361.68, "r_x2": 199.33, "r_y2": 355.29, "r_x3": 183.79, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 216.76, "t": 355.29, "r": 232.3, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 361.68, "r_x1": 232.3, "r_y1": 361.68, "r_x2": 232.3, "r_y2": 355.29, "r_x3": 216.76, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 249.73, "t": 355.29, "r": 265.27, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 361.68, "r_x1": 265.27, "r_y1": 361.68, "r_x2": 265.27, "r_y2": 355.29, "r_x3": 249.73, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 282.71, "t": 355.29, "r": 298.25, "b": 361.68, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 361.68, "r_x1": 298.25, "r_y1": 361.68, "r_x2": 298.25, "r_y2": 355.29, "r_x3": 282.71, "r_y3": 355.29, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.79, "t": 375.74, "r": 199.33, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.79, "r_y0": 382.13, "r_x1": 199.33, "r_y1": 382.13, "r_x2": 199.33, "r_y2": 375.74, "r_x3": 183.79, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 216.76, "t": 375.74, "r": 232.3, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 216.76, "r_y0": 382.13, "r_x1": 232.3, "r_y1": 382.13, "r_x2": 232.3, "r_y2": 375.74, "r_x3": 216.76, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 249.73, "t": 375.74, "r": 265.27, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.73, "r_y0": 382.13, "r_x1": 265.27, "r_y1": 382.13, "r_x2": 265.27, "r_y2": 375.74, "r_x3": 249.73, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 282.71, "t": 375.74, "r": 298.25, "b": 382.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.71, "r_y0": 382.13, "r_x1": 298.25, "r_y1": 382.13, "r_x2": 298.25, "r_y2": 375.74, "r_x3": 282.71, "r_y3": 375.74, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 395.06, "t": 411.33, "r": 401.62, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.06, "r_y0": 419.86, "r_x1": 401.62, "r_y1": 419.86, "r_x2": 401.62, "r_y2": 411.33, "r_x3": 395.06, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 407.42, "t": 411.33, "r": 412.48, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.42, "r_y0": 419.86, "r_x1": 412.48, "r_y1": 419.86, "r_x2": 412.48, "r_y2": 411.33, "r_x3": 407.42, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 418.69, "t": 411.33, "r": 425.26, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 418.69, "r_y0": 419.86, "r_x1": 425.26, "r_y1": 419.86, "r_x2": 425.26, "r_y2": 411.33, "r_x3": 418.69, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 430.51, "t": 411.33, "r": 436.57, "b": 419.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.51, "r_y0": 419.86, "r_x1": 436.57, "r_y1": 419.86, "r_x2": 436.57, "r_y2": 411.33, "r_x3": 430.51, "r_y3": 411.33, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 152.36, "t": 409.77, "r": 175.11, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.36, "r_y0": 416.17, "r_x1": 175.11, "r_y1": 416.17, "r_x2": 175.11, "r_y2": 409.77, "r_x3": 152.36, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 178.89, "t": 409.77, "r": 191.02, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 178.89, "r_y0": 416.17, "r_x1": 191.02, "r_y1": 416.17, "r_x2": 191.02, "r_y2": 409.77, "r_x3": 178.89, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 194.81, "t": 409.77, "r": 208.83, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.81, "r_y0": 416.17, "r_x1": 208.83, "r_y1": 416.17, "r_x2": 208.83, "r_y2": 409.77, "r_x3": 194.81, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 212.61, "t": 409.77, "r": 226.26, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 212.61, "r_y0": 416.17, "r_x1": 226.26, "r_y1": 416.17, "r_x2": 226.26, "r_y2": 409.77, "r_x3": 212.61, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 249.38, "t": 409.77, "r": 259.04, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 249.38, "r_y0": 416.17, "r_x1": 259.04, "r_y1": 416.17, "r_x2": 259.04, "r_y2": 409.77, "r_x3": 249.38, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 244.46, "t": 418.11, "r": 269.1, "b": 424.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 244.46, "r_y0": 424.5, "r_x1": 269.1, "r_y1": 424.5, "r_x2": 269.1, "r_y2": 418.11, "r_x3": 244.46, "r_y3": 418.11, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 230.05, "t": 409.77, "r": 245.59, "b": 416.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 230.05, "r_y0": 416.17, "r_x1": 245.59, "r_y1": 416.17, "r_x2": 245.59, "r_y2": 409.77, "r_x3": 230.05, "r_y3": 409.77, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 154.51, "t": 258.6, "r": 159.62, "b": 265.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.51, "r_y0": 265.71, "r_x1": 159.62, "r_y1": 265.71, "r_x2": 159.62, "r_y2": 258.6, "r_x3": 154.51, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 164.74, "t": 258.6, "r": 185.22, "b": 265.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.74, "r_y0": 265.71, "r_x1": 185.22, "r_y1": 265.71, "r_x2": 185.22, "r_y2": 258.6, "r_x3": 164.74, "r_y3": 258.6, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 164.35, "t": 266.5, "r": 222.05, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.35, "r_y0": 273.6, "r_x1": 222.05, "r_y1": 273.6, "r_x2": 222.05, "r_y2": 266.5, "r_x3": 164.35, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "sequence length:", "orig": "sequence length:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 224.15, "t": 266.5, "r": 232.58, "b": 273.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 224.15, "r_y0": 273.6, "r_x1": 232.58, "r_y1": 273.6, "r_x2": 232.58, "r_y2": 266.5, "r_x3": 224.15, "r_y3": 266.5, "coord_origin": "TOPLEFT" }, "text": "55", "orig": "55", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 2, "page_no": 1, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 452.31, "r": 480.59, "b": 520.89, "coord_origin": "TOPLEFT" }, "confidence": 0.95, "cells": [ { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 461.11, "r_x1": 161.33, "r_y1": 461.11, "r_x2": 161.33, "r_y2": 452.31, "r_x3": 134.76, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "today,", "orig": "today,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.27, "r_y0": 461.11, "r_x1": 226.29, "r_y1": 461.11, "r_x2": 226.29, "r_y2": 452.31, "r_x3": 164.27, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "table detection", "orig": "table detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.99, "r_y0": 461.11, "r_x1": 480.59, "r_y1": 461.11, "r_x2": 480.59, "r_y2": 452.31, "r_x3": 229.99, "r_y3": 452.31, "coord_origin": "TOPLEFT" }, "text": "in documents is a well understood problem, and the latest", "orig": "in documents is a well understood problem, and the latest", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 473.07, "r_x1": 480.59, "r_y1": 473.07, "r_x2": 480.59, "r_y2": 464.27, "r_x3": 134.77, "r_y3": 464.27, "coord_origin": "TOPLEFT" }, "text": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "orig": "state-of-the-art (SOTA) object detection methods provide an accuracy compa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 485.02, "r_x1": 480.59, "r_y1": 485.02, "r_x2": 480.59, "r_y2": 476.22, "r_x3": 134.77, "r_y3": 476.22, "coord_origin": "TOPLEFT" }, "text": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "orig": "rable to human observers [7,8,10,14,23]. On the other hand, the problem of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 496.98, "r_x1": 480.59, "r_y1": 496.98, "r_x2": 480.59, "r_y2": 488.18, "r_x3": 134.77, "r_y3": 488.18, "coord_origin": "TOPLEFT" }, "text": "structure recognition (TSR) is a lot more challenging and remains a very active", "orig": "structure recognition (TSR) is a lot more challenging and remains a very active", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 508.93, "r_x1": 480.59, "r_y1": 508.93, "r_x2": 480.59, "r_y2": 500.13, "r_x3": 134.77, "r_y3": 500.13, "coord_origin": "TOPLEFT" }, "text": "area of research, in which many novel machine learning algorithms are being", "orig": "area of research, in which many novel machine learning algorithms are being", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 520.89, "r_x1": 313.25, "r_y1": 520.89, "r_x2": 313.25, "r_y2": 512.09, "r_x3": 134.77, "r_y3": 512.09, "coord_origin": "TOPLEFT" }, "text": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "orig": "explored [3,4,5,9,11,12,13,14,17,18,21,22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "today, table detection in documents is a well understood problem, and the latest state-of-the-art (SOTA) object detection methods provide an accuracy comparable to human observers [7,8,10,14,23]. On the other hand, the problem of table structure recognition (TSR) is a lot more challenging and remains a very active area of research, in which many novel machine learning algorithms are being explored [3,4,5,9,11,12,13,14,17,18,21,22]." }, { "label": "text", "id": 0, "page_no": 1, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.77, "t": 524.55, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 149.71, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "Recently emerging SOTA methods for table structure recognition employ", "orig": "Recently emerging SOTA methods for table structure recognition employ", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.77, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "transformer-based models, in which an image of the table is provided to the net-", "orig": "transformer-based models, in which an image of the table is provided to the net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.77, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "work in order to predict the structure of the table as a sequence of tokens. These", "orig": "work in order to predict the structure of the table as a sequence of tokens. These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.77, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "orig": "image-to-sequence (Im2Seq) models are extremely powerful, since they allow for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.77, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "a purely data-driven solution. The tokens of the sequence typically belong to a", "orig": "a purely data-driven solution. The tokens of the sequence typically belong to a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.33, "r_x3": 134.77, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "markup language such as HTML, Latex or Markdown, which allow to describe", "orig": "markup language such as HTML, Latex or Markdown, which allow to describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.77, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "table structure as rows, columns and spanning cells in various configurations.", "orig": "table structure as rows, columns and spanning cells in various configurations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.77, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "orig": "In Figure 1, we illustrate how HTML is used to represent the table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.77, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "of a particular example table. Public table-structure data sets such as PubTab-", "orig": "of a particular example table. Public table-structure data sets such as PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.77, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "orig": "Net [22], and FinTabNet [21], which were created in a semi-automated way from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "orig": "paired PDF and HTML sources (e.g. PubMed Central), popularized primarily", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 421.45, "r_y1": 664.85, "r_x2": 421.45, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "the use of HTML as ground-truth representation format for TSR.", "orig": "the use of HTML as ground-truth representation format for TSR.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Recently emerging SOTA methods for table structure recognition employ transformer-based models, in which an image of the table is provided to the network in order to predict the structure of the table as a sequence of tokens. These image-to-sequence (Im2Seq) models are extremely powerful, since they allow for a purely data-driven solution. The tokens of the sequence typically belong to a markup language such as HTML, Latex or Markdown, which allow to describe table structure as rows, columns and spanning cells in various configurations. In Figure 1, we illustrate how HTML is used to represent the table-structure of a particular example table. Public table-structure data sets such as PubTabNet [22], and FinTabNet [21], which were created in a semi-automated way from paired PDF and HTML sources (e.g. PubMed Central), popularized primarily the use of HTML as ground-truth representation format for TSR." } ], "headers": [ { "label": "page_header", "id": 5, "page_no": 1, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.858, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2" }, { "label": "page_header", "id": 3, "page_no": 1, "cluster": { "id": 3, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.908, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 2, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 149.71, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 163.6, "r_x1": 169.63, "r_y1": 163.6, "r_x2": 169.63, "r_y2": 154.8, "r_x3": 134.76, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.86, "r_y0": 163.6, "r_x1": 194.56, "r_y1": 163.6, "r_x2": 194.56, "r_y2": 154.8, "r_x3": 173.86, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.61, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 199.61, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.76, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 187.51, "r_x1": 480.59, "r_y1": 187.51, "r_x2": 480.59, "r_y2": 178.71, "r_x3": 134.76, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 199.46, "r_x1": 480.59, "r_y1": 199.46, "r_x2": 480.59, "r_y2": 190.66, "r_x3": 134.76, "r_y3": 190.66, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 211.42, "r_x1": 348.36, "r_y1": 211.42, "r_x2": 348.36, "r_y2": 202.62, "r_x3": 134.76, "r_y3": 202.62, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 223.63, "r_x1": 480.59, "r_y1": 223.63, "r_x2": 480.59, "r_y2": 214.84, "r_x3": 149.71, "r_y3": 214.84, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.59, "r_x1": 480.59, "r_y1": 235.59, "r_x2": 480.59, "r_y2": 226.79, "r_x3": 134.76, "r_y3": 226.79, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.54, "r_x1": 480.59, "r_y1": 247.54, "r_x2": 480.59, "r_y2": 238.75, "r_x3": 134.76, "r_y3": 238.75, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.5, "r_x1": 480.59, "r_y1": 259.5, "r_x2": 480.59, "r_y2": 250.7, "r_x3": 134.76, "r_y3": 250.7, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 271.45, "r_x1": 480.59, "r_y1": 271.45, "r_x2": 480.59, "r_y2": 262.66, "r_x3": 134.76, "r_y3": 262.66, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.41, "r_x1": 480.6, "r_y1": 283.41, "r_x2": 480.6, "r_y2": 274.61, "r_x3": 134.76, "r_y3": 274.61, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.36, "r_x1": 480.59, "r_y1": 295.36, "r_x2": 480.59, "r_y2": 286.57, "r_x3": 134.76, "r_y3": 286.57, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 307.32, "r_x1": 480.59, "r_y1": 307.32, "r_x2": 480.59, "r_y2": 298.52, "r_x3": 134.76, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 319.27, "r_x1": 480.59, "r_y1": 319.27, "r_x2": 480.59, "r_y2": 310.48, "r_x3": 134.76, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.23, "r_x1": 179.72, "r_y1": 331.23, "r_x2": 179.72, "r_y2": 322.43, "r_x3": 134.76, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 343.44, "r_x1": 480.59, "r_y1": 343.44, "r_x2": 480.59, "r_y2": 334.65, "r_x3": 149.71, "r_y3": 334.65, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 355.4, "r_x1": 480.59, "r_y1": 355.4, "r_x2": 480.59, "r_y2": 346.6, "r_x3": 134.76, "r_y3": 346.6, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 367.36, "r_x1": 480.59, "r_y1": 367.36, "r_x2": 480.59, "r_y2": 358.56, "r_x3": 134.76, "r_y3": 358.56, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.31, "r_x1": 480.59, "r_y1": 379.31, "r_x2": 480.59, "r_y2": 370.51, "r_x3": 134.76, "r_y3": 370.51, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.27, "r_x1": 480.59, "r_y1": 391.27, "r_x2": 480.59, "r_y2": 382.47, "r_x3": 134.76, "r_y3": 382.47, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 403.22, "r_x1": 480.59, "r_y1": 403.22, "r_x2": 480.59, "r_y2": 394.42, "r_x3": 134.76, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 415.18, "r_x1": 480.59, "r_y1": 415.18, "r_x2": 480.59, "r_y2": 406.38, "r_x3": 134.76, "r_y3": 406.38, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 427.13, "r_x1": 480.6, "r_y1": 427.13, "r_x2": 480.6, "r_y2": 418.33, "r_x3": 134.76, "r_y3": 418.33, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 439.09, "r_x1": 201.27, "r_y1": 439.09, "r_x2": 201.27, "r_y2": 430.29, "r_x3": 134.76, "r_y3": 430.29, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 472.66, "r_x1": 141.49, "r_y1": 472.66, "r_x2": 141.49, "r_y2": 462.09, "r_x3": 134.76, "r_y3": 462.09, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 472.66, "r_x1": 236.77, "r_y1": 472.66, "r_x2": 236.77, "r_y2": 462.09, "r_x3": 154.94, "r_y3": 462.09, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 497.48, "r_x1": 480.59, "r_y1": 497.48, "r_x2": 480.59, "r_y2": 488.69, "r_x3": 134.76, "r_y3": 488.69, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 509.44, "r_x1": 480.59, "r_y1": 509.44, "r_x2": 480.59, "r_y2": 500.64, "r_x3": 134.76, "r_y3": 500.64, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 521.39, "r_x1": 480.59, "r_y1": 521.39, "r_x2": 480.59, "r_y2": 512.6, "r_x3": 134.76, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.76, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.76, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 484.12, "r_y1": 581.17, "r_x2": 484.12, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.6, "r_y1": 593.12, "r_x2": 480.6, "r_y2": 584.33, "r_x3": 134.76, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.76, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.76, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.86, "r_x1": 480.59, "r_y1": 664.86, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 211.42, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 149.71, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 163.6, "r_x1": 169.63, "r_y1": 163.6, "r_x2": 169.63, "r_y2": 154.8, "r_x3": 134.76, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.86, "r_y0": 163.6, "r_x1": 194.56, "r_y1": 163.6, "r_x2": 194.56, "r_y2": 154.8, "r_x3": 173.86, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.61, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 199.61, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.76, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 187.51, "r_x1": 480.59, "r_y1": 187.51, "r_x2": 480.59, "r_y2": 178.71, "r_x3": 134.76, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 199.46, "r_x1": 480.59, "r_y1": 199.46, "r_x2": 480.59, "r_y2": 190.66, "r_x3": 134.76, "r_y3": 190.66, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 211.42, "r_x1": 348.36, "r_y1": 211.42, "r_x2": 348.36, "r_y2": 202.62, "r_x3": 134.76, "r_y3": 202.62, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 214.84, "r": 480.6, "b": 331.23, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 223.63, "r_x1": 480.59, "r_y1": 223.63, "r_x2": 480.59, "r_y2": 214.84, "r_x3": 149.71, "r_y3": 214.84, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.59, "r_x1": 480.59, "r_y1": 235.59, "r_x2": 480.59, "r_y2": 226.79, "r_x3": 134.76, "r_y3": 226.79, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.54, "r_x1": 480.59, "r_y1": 247.54, "r_x2": 480.59, "r_y2": 238.75, "r_x3": 134.76, "r_y3": 238.75, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.5, "r_x1": 480.59, "r_y1": 259.5, "r_x2": 480.59, "r_y2": 250.7, "r_x3": 134.76, "r_y3": 250.7, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 271.45, "r_x1": 480.59, "r_y1": 271.45, "r_x2": 480.59, "r_y2": 262.66, "r_x3": 134.76, "r_y3": 262.66, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.41, "r_x1": 480.6, "r_y1": 283.41, "r_x2": 480.6, "r_y2": 274.61, "r_x3": 134.76, "r_y3": 274.61, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.36, "r_x1": 480.59, "r_y1": 295.36, "r_x2": 480.59, "r_y2": 286.57, "r_x3": 134.76, "r_y3": 286.57, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 307.32, "r_x1": 480.59, "r_y1": 307.32, "r_x2": 480.59, "r_y2": 298.52, "r_x3": 134.76, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 319.27, "r_x1": 480.59, "r_y1": 319.27, "r_x2": 480.59, "r_y2": 310.48, "r_x3": 134.76, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.23, "r_x1": 179.72, "r_y1": 331.23, "r_x2": 179.72, "r_y2": 322.43, "r_x3": 134.76, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 334.65, "r": 480.6, "b": 439.09, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 343.44, "r_x1": 480.59, "r_y1": 343.44, "r_x2": 480.59, "r_y2": 334.65, "r_x3": 149.71, "r_y3": 334.65, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 355.4, "r_x1": 480.59, "r_y1": 355.4, "r_x2": 480.59, "r_y2": 346.6, "r_x3": 134.76, "r_y3": 346.6, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 367.36, "r_x1": 480.59, "r_y1": 367.36, "r_x2": 480.59, "r_y2": 358.56, "r_x3": 134.76, "r_y3": 358.56, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.31, "r_x1": 480.59, "r_y1": 379.31, "r_x2": 480.59, "r_y2": 370.51, "r_x3": 134.76, "r_y3": 370.51, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.27, "r_x1": 480.59, "r_y1": 391.27, "r_x2": 480.59, "r_y2": 382.47, "r_x3": 134.76, "r_y3": 382.47, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 403.22, "r_x1": 480.59, "r_y1": 403.22, "r_x2": 480.59, "r_y2": 394.42, "r_x3": 134.76, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 415.18, "r_x1": 480.59, "r_y1": 415.18, "r_x2": 480.59, "r_y2": 406.38, "r_x3": 134.76, "r_y3": 406.38, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 427.13, "r_x1": 480.6, "r_y1": 427.13, "r_x2": 480.6, "r_y2": 418.33, "r_x3": 134.76, "r_y3": 418.33, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 439.09, "r_x1": 201.27, "r_y1": 439.09, "r_x2": 201.27, "r_y2": 430.29, "r_x3": 134.76, "r_y3": 430.29, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 134.76, "t": 462.09, "r": 236.77, "b": 472.66, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 472.66, "r_x1": 141.49, "r_y1": 472.66, "r_x2": 141.49, "r_y2": 462.09, "r_x3": 134.76, "r_y3": 462.09, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 472.66, "r_x1": 236.77, "r_y1": 472.66, "r_x2": 236.77, "r_y2": 462.09, "r_x3": 154.94, "r_y3": 462.09, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.76, "t": 488.69, "r": 484.12, "b": 664.86, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 497.48, "r_x1": 480.59, "r_y1": 497.48, "r_x2": 480.59, "r_y2": 488.69, "r_x3": 134.76, "r_y3": 488.69, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 509.44, "r_x1": 480.59, "r_y1": 509.44, "r_x2": 480.59, "r_y2": 500.64, "r_x3": 134.76, "r_y3": 500.64, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 521.39, "r_x1": 480.59, "r_y1": 521.39, "r_x2": 480.59, "r_y2": 512.6, "r_x3": 134.76, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.76, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.76, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 484.12, "r_y1": 581.17, "r_x2": 484.12, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.6, "r_y1": 593.12, "r_x2": 480.6, "r_y2": 584.33, "r_x3": 134.76, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.76, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.76, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.86, "r_x1": 480.59, "r_y1": 664.86, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" }, { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 211.42, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 149.71, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 163.6, "r_x1": 169.63, "r_y1": 163.6, "r_x2": 169.63, "r_y2": 154.8, "r_x3": 134.76, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.86, "r_y0": 163.6, "r_x1": 194.56, "r_y1": 163.6, "r_x2": 194.56, "r_y2": 154.8, "r_x3": 173.86, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.61, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 199.61, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.76, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 187.51, "r_x1": 480.59, "r_y1": 187.51, "r_x2": 480.59, "r_y2": 178.71, "r_x3": 134.76, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 199.46, "r_x1": 480.59, "r_y1": 199.46, "r_x2": 480.59, "r_y2": 190.66, "r_x3": 134.76, "r_y3": 190.66, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 211.42, "r_x1": 348.36, "r_y1": 211.42, "r_x2": 348.36, "r_y2": 202.62, "r_x3": 134.76, "r_y3": 202.62, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "While the majority of research in TSR is currently focused on the development and application of novel neural model architectures, the table structure representation language (e.g. HTML in PubTabNet and FinTabNet) is usually adopted as is for the sequence tokenization in Im2Seq models. In this paper, we aim for the opposite and investigate the impact of the table structure representation language with an otherwise unmodified Im2Seq transformer-based architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9], we select this model to perform our experiments." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 214.84, "r": 480.6, "b": 331.23, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 223.63, "r_x1": 480.59, "r_y1": 223.63, "r_x2": 480.59, "r_y2": 214.84, "r_x3": 149.71, "r_y3": 214.84, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.59, "r_x1": 480.59, "r_y1": 235.59, "r_x2": 480.59, "r_y2": 226.79, "r_x3": 134.76, "r_y3": 226.79, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.54, "r_x1": 480.59, "r_y1": 247.54, "r_x2": 480.59, "r_y2": 238.75, "r_x3": 134.76, "r_y3": 238.75, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.5, "r_x1": 480.59, "r_y1": 259.5, "r_x2": 480.59, "r_y2": 250.7, "r_x3": 134.76, "r_y3": 250.7, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 271.45, "r_x1": 480.59, "r_y1": 271.45, "r_x2": 480.59, "r_y2": 262.66, "r_x3": 134.76, "r_y3": 262.66, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.41, "r_x1": 480.6, "r_y1": 283.41, "r_x2": 480.6, "r_y2": 274.61, "r_x3": 134.76, "r_y3": 274.61, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.36, "r_x1": 480.59, "r_y1": 295.36, "r_x2": 480.59, "r_y2": 286.57, "r_x3": 134.76, "r_y3": 286.57, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 307.32, "r_x1": 480.59, "r_y1": 307.32, "r_x2": 480.59, "r_y2": 298.52, "r_x3": 134.76, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 319.27, "r_x1": 480.59, "r_y1": 319.27, "r_x2": 480.59, "r_y2": 310.48, "r_x3": 134.76, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.23, "r_x1": 179.72, "r_y1": 331.23, "r_x2": 179.72, "r_y2": 322.43, "r_x3": 134.76, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The main contribution of this paper is the introduction of a new optimised table structure language (OTSL), specifically designed to describe table-structure in an compact and structured way for Im2Seq models. OTSL has a number of key features, which make it very attractive to use in Im2Seq models. Specifically, compared to other languages such as HTML, OTSL has a minimized vocabulary which yields short sequence length, strong inherent structure (e.g. strict rectangular layout) and a strict syntax with rules that only look backwards. The latter allows for syntax validation during inference and ensures a syntactically correct table-structure. These OTSL features are illustrated in Figure 1, in comparison to HTML." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 334.65, "r": 480.6, "b": 439.09, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 343.44, "r_x1": 480.59, "r_y1": 343.44, "r_x2": 480.59, "r_y2": 334.65, "r_x3": 149.71, "r_y3": 334.65, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 355.4, "r_x1": 480.59, "r_y1": 355.4, "r_x2": 480.59, "r_y2": 346.6, "r_x3": 134.76, "r_y3": 346.6, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 367.36, "r_x1": 480.59, "r_y1": 367.36, "r_x2": 480.59, "r_y2": 358.56, "r_x3": 134.76, "r_y3": 358.56, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.31, "r_x1": 480.59, "r_y1": 379.31, "r_x2": 480.59, "r_y2": 370.51, "r_x3": 134.76, "r_y3": 370.51, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.27, "r_x1": 480.59, "r_y1": 391.27, "r_x2": 480.59, "r_y2": 382.47, "r_x3": 134.76, "r_y3": 382.47, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 403.22, "r_x1": 480.59, "r_y1": 403.22, "r_x2": 480.59, "r_y2": 394.42, "r_x3": 134.76, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 415.18, "r_x1": 480.59, "r_y1": 415.18, "r_x2": 480.59, "r_y2": 406.38, "r_x3": 134.76, "r_y3": 406.38, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 427.13, "r_x1": 480.6, "r_y1": 427.13, "r_x2": 480.6, "r_y2": 418.33, "r_x3": 134.76, "r_y3": 418.33, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 439.09, "r_x1": 201.27, "r_y1": 439.09, "r_x2": 201.27, "r_y2": 430.29, "r_x3": 134.76, "r_y3": 430.29, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In section 2, we give an overview of the latest developments in table-structure reconstruction. In section 3 we review the current HTML table encoding (popularised by PubTabNet and FinTabNet) and discuss its flaws. Subsequently, we introduce OTSL in section 4, which includes the language definition, syntax rules and error-correction procedures. In section 5, we apply OTSL on the TableFormer architecture, compare it to TableFormer models trained on HTML and ultimately demonstrate the advantages of using OTSL. Finally, in section 6 we conclude our work and outline next potential steps." }, { "label": "section_header", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.76, "t": 462.09, "r": 236.77, "b": 472.66, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 472.66, "r_x1": 141.49, "r_y1": 472.66, "r_x2": 141.49, "r_y2": 462.09, "r_x3": 134.76, "r_y3": 462.09, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 472.66, "r_x1": 236.77, "r_y1": 472.66, "r_x2": 236.77, "r_y2": 462.09, "r_x3": 154.94, "r_y3": 462.09, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2 Related Work" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76, "t": 488.69, "r": 484.12, "b": 664.86, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 497.48, "r_x1": 480.59, "r_y1": 497.48, "r_x2": 480.59, "r_y2": 488.69, "r_x3": 134.76, "r_y3": 488.69, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 509.44, "r_x1": 480.59, "r_y1": 509.44, "r_x2": 480.59, "r_y2": 500.64, "r_x3": 134.76, "r_y3": 500.64, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 521.39, "r_x1": 480.59, "r_y1": 521.39, "r_x2": 480.59, "r_y2": 512.6, "r_x3": 134.76, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.76, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.76, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 484.12, "r_y1": 581.17, "r_x2": 484.12, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.6, "r_y1": 593.12, "r_x2": 480.6, "r_y2": 584.33, "r_x3": 134.76, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.76, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.76, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.86, "r_x1": 480.59, "r_y1": 664.86, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Approaches to formalize the logical structure and layout of tables in electronic documents date back more than two decades [16]. In the recent past, a wide variety of computer vision methods have been explored to tackle the problem of table structure recognition, i.e. the correct identification of columns, rows and spanning cells in a given table. Broadly speaking, the current deeplearning based approaches fall into three categories: object detection (OD) methods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence (Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on tablestructure annotation using (overlapping) bounding boxes for training, and produce bounding-box predictions to define table cells, rows, and columns on a table image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name suggests, represent tables as graph structures. The graph nodes represent the content of each table cell, an embedding vector from the table image, or geometric coordinates of the table cell. The edges of the graph define the relationship between the nodes, e.g. if they belong to the same column, row, or table cell." } ], "body": [ { "label": "text", "id": 2, "page_no": 2, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 211.42, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 149.71, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "While the majority of research in TSR is currently focused on the develop-", "orig": "While the majority of research in TSR is currently focused on the develop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "ment and application of novel neural model architectures, the table structure", "orig": "ment and application of novel neural model architectures, the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "orig": "representation language (e.g. HTML in PubTabNet and FinTabNet) is usually", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 163.6, "r_x1": 169.63, "r_y1": 163.6, "r_x2": 169.63, "r_y2": 154.8, "r_x3": 134.76, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "adopted", "orig": "adopted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 173.86, "r_y0": 163.6, "r_x1": 194.56, "r_y1": 163.6, "r_x2": 194.56, "r_y2": 154.8, "r_x3": 173.86, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "as is", "orig": "as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.61, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 199.61, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "for the sequence tokenization in Im2Seq models. In this paper,", "orig": "for the sequence tokenization in Im2Seq models. In this paper,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.76, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "we aim for the opposite and investigate the impact of the table structure rep-", "orig": "we aim for the opposite and investigate the impact of the table structure rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 187.51, "r_x1": 480.59, "r_y1": 187.51, "r_x2": 480.59, "r_y2": 178.71, "r_x3": 134.76, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "resentation language with an otherwise unmodified Im2Seq transformer-based", "orig": "resentation language with an otherwise unmodified Im2Seq transformer-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 199.46, "r_x1": 480.59, "r_y1": 199.46, "r_x2": 480.59, "r_y2": 190.66, "r_x3": 134.76, "r_y3": 190.66, "coord_origin": "TOPLEFT" }, "text": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "orig": "architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 211.42, "r_x1": 348.36, "r_y1": 211.42, "r_x2": 348.36, "r_y2": 202.62, "r_x3": 134.76, "r_y3": 202.62, "coord_origin": "TOPLEFT" }, "text": "we select this model to perform our experiments.", "orig": "we select this model to perform our experiments.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "While the majority of research in TSR is currently focused on the development and application of novel neural model architectures, the table structure representation language (e.g. HTML in PubTabNet and FinTabNet) is usually adopted as is for the sequence tokenization in Im2Seq models. In this paper, we aim for the opposite and investigate the impact of the table structure representation language with an otherwise unmodified Im2Seq transformer-based architecture. Since the current state-of-the-art Im2Seq model is TableFormer [9], we select this model to perform our experiments." }, { "label": "text", "id": 1, "page_no": 2, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 214.84, "r": 480.6, "b": 331.23, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 223.63, "r_x1": 480.59, "r_y1": 223.63, "r_x2": 480.59, "r_y2": 214.84, "r_x3": 149.71, "r_y3": 214.84, "coord_origin": "TOPLEFT" }, "text": "The main contribution of this paper is the introduction of a new optimised ta-", "orig": "The main contribution of this paper is the introduction of a new optimised ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.59, "r_x1": 480.59, "r_y1": 235.59, "r_x2": 480.59, "r_y2": 226.79, "r_x3": 134.76, "r_y3": 226.79, "coord_origin": "TOPLEFT" }, "text": "ble structure language (OTSL), specifically designed to describe table-structure", "orig": "ble structure language (OTSL), specifically designed to describe table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.54, "r_x1": 480.59, "r_y1": 247.54, "r_x2": 480.59, "r_y2": 238.75, "r_x3": 134.76, "r_y3": 238.75, "coord_origin": "TOPLEFT" }, "text": "in an compact and structured way for Im2Seq models. OTSL has a number of", "orig": "in an compact and structured way for Im2Seq models. OTSL has a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.5, "r_x1": 480.59, "r_y1": 259.5, "r_x2": 480.59, "r_y2": 250.7, "r_x3": 134.76, "r_y3": 250.7, "coord_origin": "TOPLEFT" }, "text": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "orig": "key features, which make it very attractive to use in Im2Seq models. Specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 271.45, "r_x1": 480.59, "r_y1": 271.45, "r_x2": 480.59, "r_y2": 262.66, "r_x3": 134.76, "r_y3": 262.66, "coord_origin": "TOPLEFT" }, "text": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "orig": "compared to other languages such as HTML, OTSL has a minimized vocabulary", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.41, "r_x1": 480.6, "r_y1": 283.41, "r_x2": 480.6, "r_y2": 274.61, "r_x3": 134.76, "r_y3": 274.61, "coord_origin": "TOPLEFT" }, "text": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "orig": "which yields short sequence length, strong inherent structure (e.g. strict rectan-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.36, "r_x1": 480.59, "r_y1": 295.36, "r_x2": 480.59, "r_y2": 286.57, "r_x3": 134.76, "r_y3": 286.57, "coord_origin": "TOPLEFT" }, "text": "gular layout) and a strict syntax with rules that only look backwards. The latter", "orig": "gular layout) and a strict syntax with rules that only look backwards. The latter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 307.32, "r_x1": 480.59, "r_y1": 307.32, "r_x2": 480.59, "r_y2": 298.52, "r_x3": 134.76, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "allows for syntax validation during inference and ensures a syntactically correct", "orig": "allows for syntax validation during inference and ensures a syntactically correct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 319.27, "r_x1": 480.59, "r_y1": 319.27, "r_x2": 480.59, "r_y2": 310.48, "r_x3": 134.76, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "orig": "table-structure. These OTSL features are illustrated in Figure 1, in comparison", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.23, "r_x1": 179.72, "r_y1": 331.23, "r_x2": 179.72, "r_y2": 322.43, "r_x3": 134.76, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "to HTML.", "orig": "to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The main contribution of this paper is the introduction of a new optimised table structure language (OTSL), specifically designed to describe table-structure in an compact and structured way for Im2Seq models. OTSL has a number of key features, which make it very attractive to use in Im2Seq models. Specifically, compared to other languages such as HTML, OTSL has a minimized vocabulary which yields short sequence length, strong inherent structure (e.g. strict rectangular layout) and a strict syntax with rules that only look backwards. The latter allows for syntax validation during inference and ensures a syntactically correct table-structure. These OTSL features are illustrated in Figure 1, in comparison to HTML." }, { "label": "text", "id": 0, "page_no": 2, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 334.65, "r": 480.6, "b": 439.09, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 343.44, "r_x1": 480.59, "r_y1": 343.44, "r_x2": 480.59, "r_y2": 334.65, "r_x3": 149.71, "r_y3": 334.65, "coord_origin": "TOPLEFT" }, "text": "The paper is structured as follows. In section 2, we give an overview of the", "orig": "The paper is structured as follows. In section 2, we give an overview of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 355.4, "r_x1": 480.59, "r_y1": 355.4, "r_x2": 480.59, "r_y2": 346.6, "r_x3": 134.76, "r_y3": 346.6, "coord_origin": "TOPLEFT" }, "text": "latest developments in table-structure reconstruction. In section 3 we review", "orig": "latest developments in table-structure reconstruction. In section 3 we review", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 367.36, "r_x1": 480.59, "r_y1": 367.36, "r_x2": 480.59, "r_y2": 358.56, "r_x3": 134.76, "r_y3": 358.56, "coord_origin": "TOPLEFT" }, "text": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "orig": "the current HTML table encoding (popularised by PubTabNet and FinTabNet)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.31, "r_x1": 480.59, "r_y1": 379.31, "r_x2": 480.59, "r_y2": 370.51, "r_x3": 134.76, "r_y3": 370.51, "coord_origin": "TOPLEFT" }, "text": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "orig": "and discuss its flaws. Subsequently, we introduce OTSL in section 4, which in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.27, "r_x1": 480.59, "r_y1": 391.27, "r_x2": 480.59, "r_y2": 382.47, "r_x3": 134.76, "r_y3": 382.47, "coord_origin": "TOPLEFT" }, "text": "cludes the language definition, syntax rules and error-correction procedures. In", "orig": "cludes the language definition, syntax rules and error-correction procedures. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 403.22, "r_x1": 480.59, "r_y1": 403.22, "r_x2": 480.59, "r_y2": 394.42, "r_x3": 134.76, "r_y3": 394.42, "coord_origin": "TOPLEFT" }, "text": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "orig": "section 5, we apply OTSL on the TableFormer architecture, compare it to Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 415.18, "r_x1": 480.59, "r_y1": 415.18, "r_x2": 480.59, "r_y2": 406.38, "r_x3": 134.76, "r_y3": 406.38, "coord_origin": "TOPLEFT" }, "text": "Former models trained on HTML and ultimately demonstrate the advantages", "orig": "Former models trained on HTML and ultimately demonstrate the advantages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 427.13, "r_x1": 480.6, "r_y1": 427.13, "r_x2": 480.6, "r_y2": 418.33, "r_x3": 134.76, "r_y3": 418.33, "coord_origin": "TOPLEFT" }, "text": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "orig": "of using OTSL. Finally, in section 6 we conclude our work and outline next", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 439.09, "r_x1": 201.27, "r_y1": 439.09, "r_x2": 201.27, "r_y2": 430.29, "r_x3": 134.76, "r_y3": 430.29, "coord_origin": "TOPLEFT" }, "text": "potential steps.", "orig": "potential steps.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The paper is structured as follows. In section 2, we give an overview of the latest developments in table-structure reconstruction. In section 3 we review the current HTML table encoding (popularised by PubTabNet and FinTabNet) and discuss its flaws. Subsequently, we introduce OTSL in section 4, which includes the language definition, syntax rules and error-correction procedures. In section 5, we apply OTSL on the TableFormer architecture, compare it to TableFormer models trained on HTML and ultimately demonstrate the advantages of using OTSL. Finally, in section 6 we conclude our work and outline next potential steps." }, { "label": "section_header", "id": 4, "page_no": 2, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.76, "t": 462.09, "r": 236.77, "b": 472.66, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 472.66, "r_x1": 141.49, "r_y1": 472.66, "r_x2": 141.49, "r_y2": 462.09, "r_x3": 134.76, "r_y3": 462.09, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 472.66, "r_x1": 236.77, "r_y1": 472.66, "r_x2": 236.77, "r_y2": 462.09, "r_x3": 154.94, "r_y3": 462.09, "coord_origin": "TOPLEFT" }, "text": "Related Work", "orig": "Related Work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2 Related Work" }, { "label": "text", "id": 3, "page_no": 2, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76, "t": 488.69, "r": 484.12, "b": 664.86, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 497.48, "r_x1": 480.59, "r_y1": 497.48, "r_x2": 480.59, "r_y2": 488.69, "r_x3": 134.76, "r_y3": 488.69, "coord_origin": "TOPLEFT" }, "text": "Approaches to formalize the logical structure and layout of tables in electronic", "orig": "Approaches to formalize the logical structure and layout of tables in electronic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 509.44, "r_x1": 480.59, "r_y1": 509.44, "r_x2": 480.59, "r_y2": 500.64, "r_x3": 134.76, "r_y3": 500.64, "coord_origin": "TOPLEFT" }, "text": "documents date back more than two decades [16]. In the recent past, a wide", "orig": "documents date back more than two decades [16]. In the recent past, a wide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 521.39, "r_x1": 480.59, "r_y1": 521.39, "r_x2": 480.59, "r_y2": 512.6, "r_x3": 134.76, "r_y3": 512.6, "coord_origin": "TOPLEFT" }, "text": "variety of computer vision methods have been explored to tackle the prob-", "orig": "variety of computer vision methods have been explored to tackle the prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "lem of table structure recognition, i.e. the correct identification of columns,", "orig": "lem of table structure recognition, i.e. the correct identification of columns,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.76, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "orig": "rows and spanning cells in a given table. Broadly speaking, the current deep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "learning based approaches fall into three categories: object detection (OD) meth-", "orig": "learning based approaches fall into three categories: object detection (OD) meth-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.76, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "orig": "ods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 484.12, "r_y1": 581.17, "r_x2": 484.12, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "orig": "(Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.6, "r_y1": 593.12, "r_x2": 480.6, "r_y2": 584.33, "r_x3": 134.76, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "structure annotation using (overlapping) bounding boxes for training, and pro-", "orig": "structure annotation using (overlapping) bounding boxes for training, and pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "duce bounding-box predictions to define table cells, rows, and columns on a table", "orig": "duce bounding-box predictions to define table cells, rows, and columns on a table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.76, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "orig": "image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.76, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "suggests, represent tables as graph structures. The graph nodes represent the", "orig": "suggests, represent tables as graph structures. The graph nodes represent the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "content of each table cell, an embedding vector from the table image, or geomet-", "orig": "content of each table cell, an embedding vector from the table image, or geomet-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "ric coordinates of the table cell. The edges of the graph define the relationship", "orig": "ric coordinates of the table cell. The edges of the graph define the relationship", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.86, "r_x1": 480.59, "r_y1": 664.86, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "orig": "between the nodes, e.g. if they belong to the same column, row, or table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Approaches to formalize the logical structure and layout of tables in electronic documents date back more than two decades [16]. In the recent past, a wide variety of computer vision methods have been explored to tackle the problem of table structure recognition, i.e. the correct identification of columns, rows and spanning cells in a given table. Broadly speaking, the current deeplearning based approaches fall into three categories: object detection (OD) methods, Graph-Neural-Network (GNN) methods and Image-to-Markup-Sequence (Im2Seq) methods. Object-detection based methods [11,12,13,14,21] rely on tablestructure annotation using (overlapping) bounding boxes for training, and produce bounding-box predictions to define table cells, rows, and columns on a table image. Graph Neural Network (GNN) based methods [3,6,17,18], as the name suggests, represent tables as graph structures. The graph nodes represent the content of each table cell, an embedding vector from the table image, or geometric coordinates of the table cell. The edges of the graph define the relationship between the nodes, e.g. if they belong to the same column, row, or table cell." } ], "headers": [ { "label": "page_header", "id": 5, "page_no": 2, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 2, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.877, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3" } ] } }, { "page_no": 3, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 134.76, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.76, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 187.51, "r_x1": 480.6, "r_y1": 187.51, "r_x2": 480.6, "r_y2": 178.71, "r_x3": 134.76, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 199.46, "r_x1": 480.59, "r_y1": 199.46, "r_x2": 480.59, "r_y2": 190.66, "r_x3": 134.76, "r_y3": 190.66, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 211.42, "r_x1": 480.59, "r_y1": 211.42, "r_x2": 480.59, "r_y2": 202.62, "r_x3": 134.76, "r_y3": 202.62, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 223.37, "r_x1": 480.59, "r_y1": 223.37, "r_x2": 480.59, "r_y2": 214.58, "r_x3": 134.76, "r_y3": 214.58, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.33, "r_x1": 480.59, "r_y1": 235.33, "r_x2": 480.59, "r_y2": 226.53, "r_x3": 134.76, "r_y3": 226.53, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.28, "r_x1": 480.6, "r_y1": 247.28, "r_x2": 480.6, "r_y2": 238.49, "r_x3": 134.76, "r_y3": 238.49, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.24, "r_x1": 480.59, "r_y1": 259.24, "r_x2": 480.59, "r_y2": 250.44, "r_x3": 134.76, "r_y3": 250.44, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 271.45, "r_x1": 480.59, "r_y1": 271.45, "r_x2": 480.59, "r_y2": 262.66, "r_x3": 149.71, "r_y3": 262.66, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.41, "r_x1": 480.59, "r_y1": 283.41, "r_x2": 480.59, "r_y2": 274.61, "r_x3": 134.76, "r_y3": 274.61, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.36, "r_x1": 480.59, "r_y1": 295.36, "r_x2": 480.59, "r_y2": 286.57, "r_x3": 134.76, "r_y3": 286.57, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 307.32, "r_x1": 342.02, "r_y1": 307.32, "r_x2": 342.02, "r_y2": 298.52, "r_x3": 134.76, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.06, "r_y0": 307.32, "r_x1": 393.05, "r_y1": 307.32, "r_x2": 393.05, "r_y2": 298.52, "r_x3": 345.06, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.17, "r_y0": 307.32, "r_x1": 480.59, "r_y1": 307.32, "r_x2": 480.59, "r_y2": 298.52, "r_x3": 397.17, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 319.27, "r_x1": 333.3, "r_y1": 319.27, "r_x2": 333.3, "r_y2": 310.48, "r_x3": 134.76, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.3, "r_y0": 319.27, "r_x1": 356.97, "r_y1": 319.27, "r_x2": 356.97, "r_y2": 310.48, "r_x3": 333.3, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.08, "r_y0": 319.27, "r_x1": 480.59, "r_y1": 319.27, "r_x2": 480.59, "r_y2": 310.48, "r_x3": 357.08, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.23, "r_x1": 148.6, "r_y1": 331.23, "r_x2": 148.6, "r_y2": 322.43, "r_x3": 134.76, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.28, "r_y0": 331.23, "r_x1": 202.11, "r_y1": 331.23, "r_x2": 202.11, "r_y2": 322.43, "r_x3": 152.28, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.86, "r_y0": 331.23, "r_x1": 480.59, "r_y1": 331.23, "r_x2": 480.59, "r_y2": 322.43, "r_x3": 206.86, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 343.18, "r_x1": 480.59, "r_y1": 343.18, "r_x2": 480.59, "r_y2": 334.39, "r_x3": 134.76, "r_y3": 334.39, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 355.14, "r_x1": 480.59, "r_y1": 355.14, "r_x2": 480.59, "r_y2": 346.34, "r_x3": 134.76, "r_y3": 346.34, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 367.09, "r_x1": 480.59, "r_y1": 367.09, "r_x2": 480.59, "r_y2": 358.3, "r_x3": 134.76, "r_y3": 358.3, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.05, "r_x1": 480.59, "r_y1": 379.05, "r_x2": 480.59, "r_y2": 370.25, "r_x3": 134.76, "r_y3": 370.25, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.01, "r_x1": 480.59, "r_y1": 391.01, "r_x2": 480.59, "r_y2": 382.21, "r_x3": 134.76, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 402.96, "r_x1": 144.77, "r_y1": 402.96, "r_x2": 144.77, "r_y2": 394.16, "r_x3": 134.76, "r_y3": 394.16, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.51, "r_y0": 402.96, "r_x1": 480.59, "r_y1": 402.96, "r_x2": 480.59, "r_y2": 394.16, "r_x3": 149.51, "r_y3": 394.16, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 414.92, "r_x1": 480.6, "r_y1": 414.92, "r_x2": 480.6, "r_y2": 406.12, "r_x3": 134.76, "r_y3": 406.12, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 426.87, "r_x1": 480.59, "r_y1": 426.87, "r_x2": 480.59, "r_y2": 418.07, "r_x3": 134.76, "r_y3": 418.07, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 438.83, "r_x1": 480.59, "r_y1": 438.83, "r_x2": 480.59, "r_y2": 430.03, "r_x3": 134.76, "r_y3": 430.03, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 450.78, "r_x1": 480.59, "r_y1": 450.78, "r_x2": 480.59, "r_y2": 441.98, "r_x3": 134.76, "r_y3": 441.98, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 462.74, "r_x1": 384.58, "r_y1": 462.74, "r_x2": 384.58, "r_y2": 453.94, "r_x3": 134.76, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.56, "r_y0": 462.74, "r_x1": 401.73, "r_y1": 462.74, "r_x2": 401.73, "r_y2": 453.94, "r_x3": 391.56, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.55, "r_y0": 462.74, "r_x1": 480.59, "r_y1": 462.74, "r_x2": 480.59, "r_y2": 453.94, "r_x3": 406.55, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 474.69, "r_x1": 480.59, "r_y1": 474.69, "r_x2": 480.59, "r_y2": 465.89, "r_x3": 134.76, "r_y3": 465.89, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 486.65, "r_x1": 203.69, "r_y1": 486.65, "r_x2": 203.69, "r_y2": 477.85, "r_x3": 134.76, "r_y3": 477.85, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 498.86, "r_x1": 480.59, "r_y1": 498.86, "r_x2": 480.59, "r_y2": 490.07, "r_x3": 149.71, "r_y3": 490.07, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 510.82, "r_x1": 480.59, "r_y1": 510.82, "r_x2": 480.59, "r_y2": 502.02, "r_x3": 134.76, "r_y3": 502.02, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 522.77, "r_x1": 480.59, "r_y1": 522.77, "r_x2": 480.59, "r_y2": 513.98, "r_x3": 134.76, "r_y3": 513.98, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 534.73, "r_x1": 480.59, "r_y1": 534.73, "r_x2": 480.59, "r_y2": 525.93, "r_x3": 134.76, "r_y3": 525.93, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 546.68, "r_x1": 480.59, "r_y1": 546.68, "r_x2": 480.59, "r_y2": 537.89, "r_x3": 134.76, "r_y3": 537.89, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 558.64, "r_x1": 480.59, "r_y1": 558.64, "r_x2": 480.59, "r_y2": 549.84, "r_x3": 134.76, "r_y3": 549.84, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 570.59, "r_x1": 480.59, "r_y1": 570.59, "r_x2": 480.59, "r_y2": 561.8, "r_x3": 134.76, "r_y3": 561.8, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 582.55, "r_x1": 249.28, "r_y1": 582.55, "r_x2": 249.28, "r_y2": 573.75, "r_x3": 134.76, "r_y3": 573.75, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 616.12, "r_x1": 141.49, "r_y1": 616.12, "r_x2": 141.49, "r_y2": 605.55, "r_x3": 134.76, "r_y3": 605.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 616.12, "r_x1": 269.62, "r_y1": 616.12, "r_x2": 269.62, "r_y2": 605.55, "r_x3": 154.94, "r_y3": 605.55, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.86, "r_x1": 480.59, "r_y1": 664.86, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 6, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.789, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.905, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.6, "b": 259.24, "coord_origin": "TOPLEFT" }, "confidence": 0.947, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 134.76, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.76, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 187.51, "r_x1": 480.6, "r_y1": 187.51, "r_x2": 480.6, "r_y2": 178.71, "r_x3": 134.76, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 199.46, "r_x1": 480.59, "r_y1": 199.46, "r_x2": 480.59, "r_y2": 190.66, "r_x3": 134.76, "r_y3": 190.66, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 211.42, "r_x1": 480.59, "r_y1": 211.42, "r_x2": 480.59, "r_y2": 202.62, "r_x3": 134.76, "r_y3": 202.62, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 223.37, "r_x1": 480.59, "r_y1": 223.37, "r_x2": 480.59, "r_y2": 214.58, "r_x3": 134.76, "r_y3": 214.58, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.33, "r_x1": 480.59, "r_y1": 235.33, "r_x2": 480.59, "r_y2": 226.53, "r_x3": 134.76, "r_y3": 226.53, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.28, "r_x1": 480.6, "r_y1": 247.28, "r_x2": 480.6, "r_y2": 238.49, "r_x3": 134.76, "r_y3": 238.49, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.24, "r_x1": 480.59, "r_y1": 259.24, "r_x2": 480.59, "r_y2": 250.44, "r_x3": 134.76, "r_y3": 250.44, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 134.76, "t": 262.66, "r": 480.6, "b": 486.65, "coord_origin": "TOPLEFT" }, "confidence": 0.929, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 271.45, "r_x1": 480.59, "r_y1": 271.45, "r_x2": 480.59, "r_y2": 262.66, "r_x3": 149.71, "r_y3": 262.66, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.41, "r_x1": 480.59, "r_y1": 283.41, "r_x2": 480.59, "r_y2": 274.61, "r_x3": 134.76, "r_y3": 274.61, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.36, "r_x1": 480.59, "r_y1": 295.36, "r_x2": 480.59, "r_y2": 286.57, "r_x3": 134.76, "r_y3": 286.57, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 307.32, "r_x1": 342.02, "r_y1": 307.32, "r_x2": 342.02, "r_y2": 298.52, "r_x3": 134.76, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.06, "r_y0": 307.32, "r_x1": 393.05, "r_y1": 307.32, "r_x2": 393.05, "r_y2": 298.52, "r_x3": 345.06, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.17, "r_y0": 307.32, "r_x1": 480.59, "r_y1": 307.32, "r_x2": 480.59, "r_y2": 298.52, "r_x3": 397.17, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 319.27, "r_x1": 333.3, "r_y1": 319.27, "r_x2": 333.3, "r_y2": 310.48, "r_x3": 134.76, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.3, "r_y0": 319.27, "r_x1": 356.97, "r_y1": 319.27, "r_x2": 356.97, "r_y2": 310.48, "r_x3": 333.3, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.08, "r_y0": 319.27, "r_x1": 480.59, "r_y1": 319.27, "r_x2": 480.59, "r_y2": 310.48, "r_x3": 357.08, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.23, "r_x1": 148.6, "r_y1": 331.23, "r_x2": 148.6, "r_y2": 322.43, "r_x3": 134.76, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.28, "r_y0": 331.23, "r_x1": 202.11, "r_y1": 331.23, "r_x2": 202.11, "r_y2": 322.43, "r_x3": 152.28, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.86, "r_y0": 331.23, "r_x1": 480.59, "r_y1": 331.23, "r_x2": 480.59, "r_y2": 322.43, "r_x3": 206.86, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 343.18, "r_x1": 480.59, "r_y1": 343.18, "r_x2": 480.59, "r_y2": 334.39, "r_x3": 134.76, "r_y3": 334.39, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 355.14, "r_x1": 480.59, "r_y1": 355.14, "r_x2": 480.59, "r_y2": 346.34, "r_x3": 134.76, "r_y3": 346.34, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 367.09, "r_x1": 480.59, "r_y1": 367.09, "r_x2": 480.59, "r_y2": 358.3, "r_x3": 134.76, "r_y3": 358.3, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.05, "r_x1": 480.59, "r_y1": 379.05, "r_x2": 480.59, "r_y2": 370.25, "r_x3": 134.76, "r_y3": 370.25, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.01, "r_x1": 480.59, "r_y1": 391.01, "r_x2": 480.59, "r_y2": 382.21, "r_x3": 134.76, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 402.96, "r_x1": 144.77, "r_y1": 402.96, "r_x2": 144.77, "r_y2": 394.16, "r_x3": 134.76, "r_y3": 394.16, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.51, "r_y0": 402.96, "r_x1": 480.59, "r_y1": 402.96, "r_x2": 480.59, "r_y2": 394.16, "r_x3": 149.51, "r_y3": 394.16, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 414.92, "r_x1": 480.6, "r_y1": 414.92, "r_x2": 480.6, "r_y2": 406.12, "r_x3": 134.76, "r_y3": 406.12, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 426.87, "r_x1": 480.59, "r_y1": 426.87, "r_x2": 480.59, "r_y2": 418.07, "r_x3": 134.76, "r_y3": 418.07, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 438.83, "r_x1": 480.59, "r_y1": 438.83, "r_x2": 480.59, "r_y2": 430.03, "r_x3": 134.76, "r_y3": 430.03, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 450.78, "r_x1": 480.59, "r_y1": 450.78, "r_x2": 480.59, "r_y2": 441.98, "r_x3": 134.76, "r_y3": 441.98, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 462.74, "r_x1": 384.58, "r_y1": 462.74, "r_x2": 384.58, "r_y2": 453.94, "r_x3": 134.76, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.56, "r_y0": 462.74, "r_x1": 401.73, "r_y1": 462.74, "r_x2": 401.73, "r_y2": 453.94, "r_x3": 391.56, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.55, "r_y0": 462.74, "r_x1": 480.59, "r_y1": 462.74, "r_x2": 480.59, "r_y2": 453.94, "r_x3": 406.55, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 474.69, "r_x1": 480.59, "r_y1": 474.69, "r_x2": 480.59, "r_y2": 465.89, "r_x3": 134.76, "r_y3": 465.89, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 486.65, "r_x1": 203.69, "r_y1": 486.65, "r_x2": 203.69, "r_y2": 477.85, "r_x3": 134.76, "r_y3": 477.85, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 490.07, "r": 480.59, "b": 582.55, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 498.86, "r_x1": 480.59, "r_y1": 498.86, "r_x2": 480.59, "r_y2": 490.07, "r_x3": 149.71, "r_y3": 490.07, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 510.82, "r_x1": 480.59, "r_y1": 510.82, "r_x2": 480.59, "r_y2": 502.02, "r_x3": 134.76, "r_y3": 502.02, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 522.77, "r_x1": 480.59, "r_y1": 522.77, "r_x2": 480.59, "r_y2": 513.98, "r_x3": 134.76, "r_y3": 513.98, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 534.73, "r_x1": 480.59, "r_y1": 534.73, "r_x2": 480.59, "r_y2": 525.93, "r_x3": 134.76, "r_y3": 525.93, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 546.68, "r_x1": 480.59, "r_y1": 546.68, "r_x2": 480.59, "r_y2": 537.89, "r_x3": 134.76, "r_y3": 537.89, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 558.64, "r_x1": 480.59, "r_y1": 558.64, "r_x2": 480.59, "r_y2": 549.84, "r_x3": 134.76, "r_y3": 549.84, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 570.59, "r_x1": 480.59, "r_y1": 570.59, "r_x2": 480.59, "r_y2": 561.8, "r_x3": 134.76, "r_y3": 561.8, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 582.55, "r_x1": 249.28, "r_y1": 582.55, "r_x2": 249.28, "r_y2": 573.75, "r_x3": 134.76, "r_y3": 573.75, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.76, "t": 605.55, "r": 269.62, "b": 616.12, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 616.12, "r_x1": 141.49, "r_y1": 616.12, "r_x2": 141.49, "r_y2": 605.55, "r_x3": 134.76, "r_y3": 605.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 616.12, "r_x1": 269.62, "r_y1": 616.12, "r_x2": 269.62, "r_y2": 605.55, "r_x3": 154.94, "r_y3": 605.55, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 632.15, "r": 480.59, "b": 664.86, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.86, "r_x1": 480.59, "r_y1": 664.86, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.789, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" }, { "label": "page_header", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.905, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.6, "b": 259.24, "coord_origin": "TOPLEFT" }, "confidence": 0.947, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 134.76, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.76, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 187.51, "r_x1": 480.6, "r_y1": 187.51, "r_x2": 480.6, "r_y2": 178.71, "r_x3": 134.76, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 199.46, "r_x1": 480.59, "r_y1": 199.46, "r_x2": 480.59, "r_y2": 190.66, "r_x3": 134.76, "r_y3": 190.66, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 211.42, "r_x1": 480.59, "r_y1": 211.42, "r_x2": 480.59, "r_y2": 202.62, "r_x3": 134.76, "r_y3": 202.62, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 223.37, "r_x1": 480.59, "r_y1": 223.37, "r_x2": 480.59, "r_y2": 214.58, "r_x3": 134.76, "r_y3": 214.58, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.33, "r_x1": 480.59, "r_y1": 235.33, "r_x2": 480.59, "r_y2": 226.53, "r_x3": 134.76, "r_y3": 226.53, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.28, "r_x1": 480.6, "r_y1": 247.28, "r_x2": 480.6, "r_y2": 238.49, "r_x3": 134.76, "r_y3": 238.49, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.24, "r_x1": 480.59, "r_y1": 259.24, "r_x2": 480.59, "r_y2": 250.44, "r_x3": 134.76, "r_y3": 250.44, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells must be merged using an attention network. Im2Seq methods cast the problem as a sequence generation task [4,5,9,22], and therefore need an internal tablestructure representation language, which is often implemented with standard markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods have a natural advantage over the OD and GNN methods by virtue of directly predicting the table-structure. As such, no post-processing or rules are needed in order to obtain the table-structure, which is necessary with OD and GNN approaches. In practice, this is not entirely true, because a predicted sequence of table-structure markup does not necessarily have to be syntactically correct. Hence, depending on the quality of the predicted sequence, some post-processing needs to be performed to ensure a syntactically valid (let alone correct) sequence." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.76, "t": 262.66, "r": 480.6, "b": 486.65, "coord_origin": "TOPLEFT" }, "confidence": 0.929, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 271.45, "r_x1": 480.59, "r_y1": 271.45, "r_x2": 480.59, "r_y2": 262.66, "r_x3": 149.71, "r_y3": 262.66, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.41, "r_x1": 480.59, "r_y1": 283.41, "r_x2": 480.59, "r_y2": 274.61, "r_x3": 134.76, "r_y3": 274.61, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.36, "r_x1": 480.59, "r_y1": 295.36, "r_x2": 480.59, "r_y2": 286.57, "r_x3": 134.76, "r_y3": 286.57, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 307.32, "r_x1": 342.02, "r_y1": 307.32, "r_x2": 342.02, "r_y2": 298.52, "r_x3": 134.76, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.06, "r_y0": 307.32, "r_x1": 393.05, "r_y1": 307.32, "r_x2": 393.05, "r_y2": 298.52, "r_x3": 345.06, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.17, "r_y0": 307.32, "r_x1": 480.59, "r_y1": 307.32, "r_x2": 480.59, "r_y2": 298.52, "r_x3": 397.17, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 319.27, "r_x1": 333.3, "r_y1": 319.27, "r_x2": 333.3, "r_y2": 310.48, "r_x3": 134.76, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.3, "r_y0": 319.27, "r_x1": 356.97, "r_y1": 319.27, "r_x2": 356.97, "r_y2": 310.48, "r_x3": 333.3, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.08, "r_y0": 319.27, "r_x1": 480.59, "r_y1": 319.27, "r_x2": 480.59, "r_y2": 310.48, "r_x3": 357.08, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.23, "r_x1": 148.6, "r_y1": 331.23, "r_x2": 148.6, "r_y2": 322.43, "r_x3": 134.76, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.28, "r_y0": 331.23, "r_x1": 202.11, "r_y1": 331.23, "r_x2": 202.11, "r_y2": 322.43, "r_x3": 152.28, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.86, "r_y0": 331.23, "r_x1": 480.59, "r_y1": 331.23, "r_x2": 480.59, "r_y2": 322.43, "r_x3": 206.86, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 343.18, "r_x1": 480.59, "r_y1": 343.18, "r_x2": 480.59, "r_y2": 334.39, "r_x3": 134.76, "r_y3": 334.39, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 355.14, "r_x1": 480.59, "r_y1": 355.14, "r_x2": 480.59, "r_y2": 346.34, "r_x3": 134.76, "r_y3": 346.34, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 367.09, "r_x1": 480.59, "r_y1": 367.09, "r_x2": 480.59, "r_y2": 358.3, "r_x3": 134.76, "r_y3": 358.3, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.05, "r_x1": 480.59, "r_y1": 379.05, "r_x2": 480.59, "r_y2": 370.25, "r_x3": 134.76, "r_y3": 370.25, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.01, "r_x1": 480.59, "r_y1": 391.01, "r_x2": 480.59, "r_y2": 382.21, "r_x3": 134.76, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 402.96, "r_x1": 144.77, "r_y1": 402.96, "r_x2": 144.77, "r_y2": 394.16, "r_x3": 134.76, "r_y3": 394.16, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.51, "r_y0": 402.96, "r_x1": 480.59, "r_y1": 402.96, "r_x2": 480.59, "r_y2": 394.16, "r_x3": 149.51, "r_y3": 394.16, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 414.92, "r_x1": 480.6, "r_y1": 414.92, "r_x2": 480.6, "r_y2": 406.12, "r_x3": 134.76, "r_y3": 406.12, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 426.87, "r_x1": 480.59, "r_y1": 426.87, "r_x2": 480.59, "r_y2": 418.07, "r_x3": 134.76, "r_y3": 418.07, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 438.83, "r_x1": 480.59, "r_y1": 438.83, "r_x2": 480.59, "r_y2": 430.03, "r_x3": 134.76, "r_y3": 430.03, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 450.78, "r_x1": 480.59, "r_y1": 450.78, "r_x2": 480.59, "r_y2": 441.98, "r_x3": 134.76, "r_y3": 441.98, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 462.74, "r_x1": 384.58, "r_y1": 462.74, "r_x2": 384.58, "r_y2": 453.94, "r_x3": 134.76, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.56, "r_y0": 462.74, "r_x1": 401.73, "r_y1": 462.74, "r_x2": 401.73, "r_y2": 453.94, "r_x3": 391.56, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.55, "r_y0": 462.74, "r_x1": 480.59, "r_y1": 462.74, "r_x2": 480.59, "r_y2": 453.94, "r_x3": 406.55, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 474.69, "r_x1": 480.59, "r_y1": 474.69, "r_x2": 480.59, "r_y2": 465.89, "r_x3": 134.76, "r_y3": 465.89, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 486.65, "r_x1": 203.69, "r_y1": 486.65, "r_x2": 203.69, "r_y2": 477.85, "r_x3": 134.76, "r_y3": 477.85, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Within the Im2Seq method, we find several popular models, namely the encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders to predict a table in HTML representation. The tag decoder predicts a sequence of HTML tags. For each decoded table cell ( ), the attention is passed to the cell decoder to predict the content with an embedded OCR approach. The latter makes it susceptible to transcription errors in the cell content of the table. TableFormer address this reliance on OCR and uses two transformer decoders for HTML structure and cell bounding box prediction in an end-to-end architecture. The predicted cell bounding box is then used to extract text tokens from an originating (digital) PDF page, circumventing any need for OCR. TabSplitter [2] proposes a compact double-matrix representation of table rows and columns to do error detection and error correction of HTML structure sequences based on predictions from [19]. This compact double-matrix representation can not be used directly by the Img2seq model training, so the model uses HTML as an intermediate form. Chi et. al. [4] introduce a data set and a baseline method using bidirectional LSTMs to predict LaTeX code. Kayal [5] introduces Gated ResNet transformers to predict LaTeX code, and a separate OCR module to extract content." }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 490.07, "r": 480.59, "b": 582.55, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 498.86, "r_x1": 480.59, "r_y1": 498.86, "r_x2": 480.59, "r_y2": 490.07, "r_x3": 149.71, "r_y3": 490.07, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 510.82, "r_x1": 480.59, "r_y1": 510.82, "r_x2": 480.59, "r_y2": 502.02, "r_x3": 134.76, "r_y3": 502.02, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 522.77, "r_x1": 480.59, "r_y1": 522.77, "r_x2": 480.59, "r_y2": 513.98, "r_x3": 134.76, "r_y3": 513.98, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 534.73, "r_x1": 480.59, "r_y1": 534.73, "r_x2": 480.59, "r_y2": 525.93, "r_x3": 134.76, "r_y3": 525.93, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 546.68, "r_x1": 480.59, "r_y1": 546.68, "r_x2": 480.59, "r_y2": 537.89, "r_x3": 134.76, "r_y3": 537.89, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 558.64, "r_x1": 480.59, "r_y1": 558.64, "r_x2": 480.59, "r_y2": 549.84, "r_x3": 134.76, "r_y3": 549.84, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 570.59, "r_x1": 480.59, "r_y1": 570.59, "r_x2": 480.59, "r_y2": 561.8, "r_x3": 134.76, "r_y3": 561.8, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 582.55, "r_x1": 249.28, "r_y1": 582.55, "r_x2": 249.28, "r_y2": 573.75, "r_x3": 134.76, "r_y3": 573.75, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a full end-to-end network design that can output the final table structure without pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated to deliver state-of-the-art prediction accuracy [9]. This motivated the authors to investigate if the performance (both in accuracy and inference time) can be further improved by optimising the table structure representation language. We believe this is a necessary step before further improving neural network architectures for this task." }, { "label": "section_header", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76, "t": 605.55, "r": 269.62, "b": 616.12, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 616.12, "r_x1": 141.49, "r_y1": 616.12, "r_x2": 141.49, "r_y2": 605.55, "r_x3": 134.76, "r_y3": 605.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 616.12, "r_x1": 269.62, "r_y1": 616.12, "r_x2": 269.62, "r_y2": 605.55, "r_x3": 154.94, "r_y3": 605.55, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3 Problem Statement" }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 632.15, "r": 480.59, "b": 664.86, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.86, "r_x1": 480.59, "r_y1": 664.86, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways. Given an image of a table, the Im2Seq model predicts the structure of the table by generating a sequence of tokens. These tokens originate from a finite vocab-" } ], "body": [ { "label": "text", "id": 2, "page_no": 3, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.6, "b": 259.24, "coord_origin": "TOPLEFT" }, "confidence": 0.947, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells", "orig": "Other work [20] aims at predicting a grid for each table and deciding which cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "must be merged using an attention network. Im2Seq methods cast the problem", "orig": "must be merged using an attention network. Im2Seq methods cast the problem", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "orig": "as a sequence generation task [4,5,9,22], and therefore need an internal table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 134.76, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "structure representation language, which is often implemented with standard", "orig": "structure representation language, which is often implemented with standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.76, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "orig": "markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 187.51, "r_x1": 480.6, "r_y1": 187.51, "r_x2": 480.6, "r_y2": 178.71, "r_x3": 134.76, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "have a natural advantage over the OD and GNN methods by virtue of directly", "orig": "have a natural advantage over the OD and GNN methods by virtue of directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 199.46, "r_x1": 480.59, "r_y1": 199.46, "r_x2": 480.59, "r_y2": 190.66, "r_x3": 134.76, "r_y3": 190.66, "coord_origin": "TOPLEFT" }, "text": "predicting the table-structure. As such, no post-processing or rules are needed", "orig": "predicting the table-structure. As such, no post-processing or rules are needed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 211.42, "r_x1": 480.59, "r_y1": 211.42, "r_x2": 480.59, "r_y2": 202.62, "r_x3": 134.76, "r_y3": 202.62, "coord_origin": "TOPLEFT" }, "text": "in order to obtain the table-structure, which is necessary with OD and GNN", "orig": "in order to obtain the table-structure, which is necessary with OD and GNN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 223.37, "r_x1": 480.59, "r_y1": 223.37, "r_x2": 480.59, "r_y2": 214.58, "r_x3": 134.76, "r_y3": 214.58, "coord_origin": "TOPLEFT" }, "text": "approaches. In practice, this is not entirely true, because a predicted sequence", "orig": "approaches. In practice, this is not entirely true, because a predicted sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.33, "r_x1": 480.59, "r_y1": 235.33, "r_x2": 480.59, "r_y2": 226.53, "r_x3": 134.76, "r_y3": 226.53, "coord_origin": "TOPLEFT" }, "text": "of table-structure markup does not necessarily have to be syntactically correct.", "orig": "of table-structure markup does not necessarily have to be syntactically correct.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.28, "r_x1": 480.6, "r_y1": 247.28, "r_x2": 480.6, "r_y2": 238.49, "r_x3": 134.76, "r_y3": 238.49, "coord_origin": "TOPLEFT" }, "text": "Hence, depending on the quality of the predicted sequence, some post-processing", "orig": "Hence, depending on the quality of the predicted sequence, some post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.24, "r_x1": 480.59, "r_y1": 259.24, "r_x2": 480.59, "r_y2": 250.44, "r_x3": 134.76, "r_y3": 250.44, "coord_origin": "TOPLEFT" }, "text": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "orig": "needs to be performed to ensure a syntactically valid (let alone correct) sequence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Other work [20] aims at predicting a grid for each table and deciding which cells must be merged using an attention network. Im2Seq methods cast the problem as a sequence generation task [4,5,9,22], and therefore need an internal tablestructure representation language, which is often implemented with standard markup languages (e.g. HTML, LaTeX, Markdown). In theory, Im2Seq methods have a natural advantage over the OD and GNN methods by virtue of directly predicting the table-structure. As such, no post-processing or rules are needed in order to obtain the table-structure, which is necessary with OD and GNN approaches. In practice, this is not entirely true, because a predicted sequence of table-structure markup does not necessarily have to be syntactically correct. Hence, depending on the quality of the predicted sequence, some post-processing needs to be performed to ensure a syntactically valid (let alone correct) sequence." }, { "label": "text", "id": 4, "page_no": 3, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.76, "t": 262.66, "r": 480.6, "b": 486.65, "coord_origin": "TOPLEFT" }, "confidence": 0.929, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 271.45, "r_x1": 480.59, "r_y1": 271.45, "r_x2": 480.59, "r_y2": 262.66, "r_x3": 149.71, "r_y3": 262.66, "coord_origin": "TOPLEFT" }, "text": "Within the Im2Seq method, we find several popular models, namely the", "orig": "Within the Im2Seq method, we find several popular models, namely the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.41, "r_x1": 480.59, "r_y1": 283.41, "r_x2": 480.59, "r_y2": 274.61, "r_x3": 134.76, "r_y3": 274.61, "coord_origin": "TOPLEFT" }, "text": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "orig": "encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.36, "r_x1": 480.59, "r_y1": 295.36, "r_x2": 480.59, "r_y2": 286.57, "r_x3": 134.76, "r_y3": 286.57, "coord_origin": "TOPLEFT" }, "text": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "orig": "et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 307.32, "r_x1": 342.02, "r_y1": 307.32, "r_x2": 342.02, "r_y2": 298.52, "r_x3": 134.76, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "to predict a table in HTML representation. The", "orig": "to predict a table in HTML representation. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.06, "r_y0": 307.32, "r_x1": 393.05, "r_y1": 307.32, "r_x2": 393.05, "r_y2": 298.52, "r_x3": 345.06, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "tag decoder", "orig": "tag decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.17, "r_y0": 307.32, "r_x1": 480.59, "r_y1": 307.32, "r_x2": 480.59, "r_y2": 298.52, "r_x3": 397.17, "r_y3": 298.52, "coord_origin": "TOPLEFT" }, "text": "predicts a sequence", "orig": "predicts a sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 319.27, "r_x1": 333.3, "r_y1": 319.27, "r_x2": 333.3, "r_y2": 310.48, "r_x3": 134.76, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "of HTML tags. For each decoded table cell (", "orig": "of HTML tags. For each decoded table cell (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.3, "r_y0": 319.27, "r_x1": 356.97, "r_y1": 319.27, "r_x2": 356.97, "r_y2": 310.48, "r_x3": 333.3, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 357.08, "r_y0": 319.27, "r_x1": 480.59, "r_y1": 319.27, "r_x2": 480.59, "r_y2": 310.48, "r_x3": 357.08, "r_y3": 310.48, "coord_origin": "TOPLEFT" }, "text": "), the attention is passed to", "orig": "), the attention is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.23, "r_x1": 148.6, "r_y1": 331.23, "r_x2": 148.6, "r_y2": 322.43, "r_x3": 134.76, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.28, "r_y0": 331.23, "r_x1": 202.11, "r_y1": 331.23, "r_x2": 202.11, "r_y2": 322.43, "r_x3": 152.28, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "cell decoder", "orig": "cell decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 206.86, "r_y0": 331.23, "r_x1": 480.59, "r_y1": 331.23, "r_x2": 480.59, "r_y2": 322.43, "r_x3": 206.86, "r_y3": 322.43, "coord_origin": "TOPLEFT" }, "text": "to predict the content with an embedded OCR approach. The", "orig": "to predict the content with an embedded OCR approach. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 343.18, "r_x1": 480.59, "r_y1": 343.18, "r_x2": 480.59, "r_y2": 334.39, "r_x3": 134.76, "r_y3": 334.39, "coord_origin": "TOPLEFT" }, "text": "latter makes it susceptible to transcription errors in the cell content of the table.", "orig": "latter makes it susceptible to transcription errors in the cell content of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 355.14, "r_x1": 480.59, "r_y1": 355.14, "r_x2": 480.59, "r_y2": 346.34, "r_x3": 134.76, "r_y3": 346.34, "coord_origin": "TOPLEFT" }, "text": "TableFormer address this reliance on OCR and uses two transformer decoders for", "orig": "TableFormer address this reliance on OCR and uses two transformer decoders for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 367.09, "r_x1": 480.59, "r_y1": 367.09, "r_x2": 480.59, "r_y2": 358.3, "r_x3": 134.76, "r_y3": 358.3, "coord_origin": "TOPLEFT" }, "text": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "orig": "HTML structure and cell bounding box prediction in an end-to-end architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.05, "r_x1": 480.59, "r_y1": 379.05, "r_x2": 480.59, "r_y2": 370.25, "r_x3": 134.76, "r_y3": 370.25, "coord_origin": "TOPLEFT" }, "text": "The predicted cell bounding box is then used to extract text tokens from an", "orig": "The predicted cell bounding box is then used to extract text tokens from an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.01, "r_x1": 480.59, "r_y1": 391.01, "r_x2": 480.59, "r_y2": 382.21, "r_x3": 134.76, "r_y3": 382.21, "coord_origin": "TOPLEFT" }, "text": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "orig": "originating (digital) PDF page, circumventing any need for OCR. TabSplitter", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 402.96, "r_x1": 144.77, "r_y1": 402.96, "r_x2": 144.77, "r_y2": 394.16, "r_x3": 134.76, "r_y3": 394.16, "coord_origin": "TOPLEFT" }, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.51, "r_y0": 402.96, "r_x1": 480.59, "r_y1": 402.96, "r_x2": 480.59, "r_y2": 394.16, "r_x3": 149.51, "r_y3": 394.16, "coord_origin": "TOPLEFT" }, "text": "proposes a compact double-matrix representation of table rows and columns", "orig": "proposes a compact double-matrix representation of table rows and columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 414.92, "r_x1": 480.6, "r_y1": 414.92, "r_x2": 480.6, "r_y2": 406.12, "r_x3": 134.76, "r_y3": 406.12, "coord_origin": "TOPLEFT" }, "text": "to do error detection and error correction of HTML structure sequences based", "orig": "to do error detection and error correction of HTML structure sequences based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 426.87, "r_x1": 480.59, "r_y1": 426.87, "r_x2": 480.59, "r_y2": 418.07, "r_x3": 134.76, "r_y3": 418.07, "coord_origin": "TOPLEFT" }, "text": "on predictions from [19]. This compact double-matrix representation can not be", "orig": "on predictions from [19]. This compact double-matrix representation can not be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 438.83, "r_x1": 480.59, "r_y1": 438.83, "r_x2": 480.59, "r_y2": 430.03, "r_x3": 134.76, "r_y3": 430.03, "coord_origin": "TOPLEFT" }, "text": "used directly by the Img2seq model training, so the model uses HTML as an", "orig": "used directly by the Img2seq model training, so the model uses HTML as an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 450.78, "r_x1": 480.59, "r_y1": 450.78, "r_x2": 480.59, "r_y2": 441.98, "r_x3": 134.76, "r_y3": 441.98, "coord_origin": "TOPLEFT" }, "text": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "orig": "intermediate form. Chi et. al. [4] introduce a data set and a baseline method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 462.74, "r_x1": 384.58, "r_y1": 462.74, "r_x2": 384.58, "r_y2": 453.94, "r_x3": 134.76, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "using bidirectional LSTMs to predict LaTeX code. Kayal", "orig": "using bidirectional LSTMs to predict LaTeX code. Kayal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.56, "r_y0": 462.74, "r_x1": 401.73, "r_y1": 462.74, "r_x2": 401.73, "r_y2": 453.94, "r_x3": 391.56, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 406.55, "r_y0": 462.74, "r_x1": 480.59, "r_y1": 462.74, "r_x2": 480.59, "r_y2": 453.94, "r_x3": 406.55, "r_y3": 453.94, "coord_origin": "TOPLEFT" }, "text": "introduces Gated", "orig": "introduces Gated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 474.69, "r_x1": 480.59, "r_y1": 474.69, "r_x2": 480.59, "r_y2": 465.89, "r_x3": 134.76, "r_y3": 465.89, "coord_origin": "TOPLEFT" }, "text": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "orig": "ResNet transformers to predict LaTeX code, and a separate OCR module to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 486.65, "r_x1": 203.69, "r_y1": 486.65, "r_x2": 203.69, "r_y2": 477.85, "r_x3": 134.76, "r_y3": 477.85, "coord_origin": "TOPLEFT" }, "text": "extract content.", "orig": "extract content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Within the Im2Seq method, we find several popular models, namely the encoder-dual-decoder model (EDD) [22], TableFormer [9], Tabsplitter[2] and Ye et. al. [19]. EDD uses two consecutive long short-term memory (LSTM) decoders to predict a table in HTML representation. The tag decoder predicts a sequence of HTML tags. For each decoded table cell ( ), the attention is passed to the cell decoder to predict the content with an embedded OCR approach. The latter makes it susceptible to transcription errors in the cell content of the table. TableFormer address this reliance on OCR and uses two transformer decoders for HTML structure and cell bounding box prediction in an end-to-end architecture. The predicted cell bounding box is then used to extract text tokens from an originating (digital) PDF page, circumventing any need for OCR. TabSplitter [2] proposes a compact double-matrix representation of table rows and columns to do error detection and error correction of HTML structure sequences based on predictions from [19]. This compact double-matrix representation can not be used directly by the Img2seq model training, so the model uses HTML as an intermediate form. Chi et. al. [4] introduce a data set and a baseline method using bidirectional LSTMs to predict LaTeX code. Kayal [5] introduces Gated ResNet transformers to predict LaTeX code, and a separate OCR module to extract content." }, { "label": "text", "id": 0, "page_no": 3, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 490.07, "r": 480.59, "b": 582.55, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 498.86, "r_x1": 480.59, "r_y1": 498.86, "r_x2": 480.59, "r_y2": 490.07, "r_x3": 149.71, "r_y3": 490.07, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "orig": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 510.82, "r_x1": 480.59, "r_y1": 510.82, "r_x2": 480.59, "r_y2": 502.02, "r_x3": 134.76, "r_y3": 502.02, "coord_origin": "TOPLEFT" }, "text": "full end-to-end network design that can output the final table structure without", "orig": "full end-to-end network design that can output the final table structure without", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 522.77, "r_x1": 480.59, "r_y1": 522.77, "r_x2": 480.59, "r_y2": 513.98, "r_x3": 134.76, "r_y3": 513.98, "coord_origin": "TOPLEFT" }, "text": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "orig": "pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 534.73, "r_x1": 480.59, "r_y1": 534.73, "r_x2": 480.59, "r_y2": 525.93, "r_x3": 134.76, "r_y3": 525.93, "coord_origin": "TOPLEFT" }, "text": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "orig": "to deliver state-of-the-art prediction accuracy [9]. This motivated the authors", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 546.68, "r_x1": 480.59, "r_y1": 546.68, "r_x2": 480.59, "r_y2": 537.89, "r_x3": 134.76, "r_y3": 537.89, "coord_origin": "TOPLEFT" }, "text": "to investigate if the performance (both in accuracy and inference time) can", "orig": "to investigate if the performance (both in accuracy and inference time) can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 558.64, "r_x1": 480.59, "r_y1": 558.64, "r_x2": 480.59, "r_y2": 549.84, "r_x3": 134.76, "r_y3": 549.84, "coord_origin": "TOPLEFT" }, "text": "be further improved by optimising the table structure representation language.", "orig": "be further improved by optimising the table structure representation language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 570.59, "r_x1": 480.59, "r_y1": 570.59, "r_x2": 480.59, "r_y2": 561.8, "r_x3": 134.76, "r_y3": 561.8, "coord_origin": "TOPLEFT" }, "text": "We believe this is a necessary step before further improving neural network", "orig": "We believe this is a necessary step before further improving neural network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 582.55, "r_x1": 249.28, "r_y1": 582.55, "r_x2": 249.28, "r_y2": 573.75, "r_x3": 134.76, "r_y3": 573.75, "coord_origin": "TOPLEFT" }, "text": "architectures for this task.", "orig": "architectures for this task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Im2Seq approaches have shown to be well-suited for the TSR task and allow a full end-to-end network design that can output the final table structure without pre- or post-processing logic. Furthermore, Im2Seq models have demonstrated to deliver state-of-the-art prediction accuracy [9]. This motivated the authors to investigate if the performance (both in accuracy and inference time) can be further improved by optimising the table structure representation language. We believe this is a necessary step before further improving neural network architectures for this task." }, { "label": "section_header", "id": 3, "page_no": 3, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76, "t": 605.55, "r": 269.62, "b": 616.12, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 616.12, "r_x1": 141.49, "r_y1": 616.12, "r_x2": 141.49, "r_y2": 605.55, "r_x3": 134.76, "r_y3": 605.55, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 616.12, "r_x1": 269.62, "r_y1": 616.12, "r_x2": 269.62, "r_y2": 605.55, "r_x3": 154.94, "r_y3": 605.55, "coord_origin": "TOPLEFT" }, "text": "Problem Statement", "orig": "Problem Statement", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3 Problem Statement" }, { "label": "text", "id": 1, "page_no": 3, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 632.15, "r": 480.59, "b": 664.86, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "orig": "All known Im2Seq based models for TSR fundamentally work in similar ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "Given an image of a table, the Im2Seq model predicts the structure of the table", "orig": "Given an image of a table, the Im2Seq model predicts the structure of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.86, "r_x1": 480.59, "r_y1": 664.86, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "orig": "by generating a sequence of tokens. These tokens originate from a finite vocab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "All known Im2Seq based models for TSR fundamentally work in similar ways. Given an image of a table, the Im2Seq model predicts the structure of the table by generating a sequence of tokens. These tokens originate from a finite vocab-" } ], "headers": [ { "label": "page_header", "id": 6, "page_no": 3, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.789, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4" }, { "label": "page_header", "id": 5, "page_no": 3, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.905, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 4, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 162.48, "r_y1": 139.69, "r_x2": 162.48, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.37, "r_y0": 139.69, "r_x1": 201.75, "r_y1": 139.69, "r_x2": 201.75, "r_y2": 130.89, "r_x3": 166.37, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.75, "r_y0": 139.69, "r_x1": 204.52, "r_y1": 139.69, "r_x2": 204.52, "r_y2": 130.89, "r_x3": 201.75, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.4, "r_y0": 139.69, "r_x1": 248.87, "r_y1": 139.69, "r_x2": 248.87, "r_y2": 130.89, "r_x3": 208.4, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.87, "r_y0": 139.69, "r_x1": 251.64, "r_y1": 139.69, "r_x2": 251.64, "r_y2": 130.89, "r_x3": 248.87, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.52, "r_y0": 139.69, "r_x1": 278.3, "r_y1": 139.69, "r_x2": 278.3, "r_y2": 130.89, "r_x3": 255.52, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.3, "r_y0": 139.69, "r_x1": 281.06, "r_y1": 139.69, "r_x2": 281.06, "r_y2": 130.89, "r_x3": 278.3, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.95, "r_y0": 139.69, "r_x1": 312.82, "r_y1": 139.69, "r_x2": 312.82, "r_y2": 130.89, "r_x3": 284.95, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 139.69, "r_x1": 315.58, "r_y1": 139.69, "r_x2": 315.58, "r_y2": 130.89, "r_x3": 312.82, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.47, "r_y0": 139.69, "r_x1": 343.14, "r_y1": 139.69, "r_x2": 343.14, "r_y2": 130.89, "r_x3": 319.47, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.13, "r_y0": 139.69, "r_x1": 363.18, "r_y1": 139.69, "r_x2": 363.18, "r_y2": 130.89, "r_x3": 347.13, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06, "r_y0": 139.69, "r_x1": 395.82, "r_y1": 139.69, "r_x2": 395.82, "r_y2": 130.89, "r_x3": 367.06, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.82, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 395.82, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.77, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 134.77, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.77, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 187.51, "r_x1": 261.93, "r_y1": 187.51, "r_x2": 261.93, "r_y2": 178.71, "r_x3": 134.77, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.61, "r_y0": 229.01, "r_x1": 173.49, "r_y1": 229.01, "r_x2": 173.49, "r_y2": 221.08, "r_x3": 145.61, "r_y3": 221.08, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56, "r_y0": 229.21, "r_x1": 469.75, "r_y1": 229.21, "r_x2": 469.75, "r_y2": 221.14, "r_x3": 176.56, "r_y3": 221.14, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 377.0, "r_x1": 480.59, "r_y1": 377.0, "r_x2": 480.59, "r_y2": 368.21, "r_x3": 149.71, "r_y3": 368.21, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 388.96, "r_x1": 480.59, "r_y1": 388.96, "r_x2": 480.59, "r_y2": 380.16, "r_x3": 134.76, "r_y3": 380.16, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 400.91, "r_x1": 480.59, "r_y1": 400.91, "r_x2": 480.59, "r_y2": 392.12, "r_x3": 134.76, "r_y3": 392.12, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 412.87, "r_x1": 480.59, "r_y1": 412.87, "r_x2": 480.59, "r_y2": 404.07, "r_x3": 134.76, "r_y3": 404.07, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 424.82, "r_x1": 480.59, "r_y1": 424.82, "r_x2": 480.59, "r_y2": 416.03, "r_x3": 134.76, "r_y3": 416.03, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 436.78, "r_x1": 480.59, "r_y1": 436.78, "r_x2": 480.59, "r_y2": 427.98, "r_x3": 134.76, "r_y3": 427.98, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 448.73, "r_x1": 187.93, "r_y1": 448.73, "r_x2": 187.93, "r_y2": 439.94, "r_x3": 134.76, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.93, "r_y0": 448.73, "r_x1": 211.6, "r_y1": 448.73, "r_x2": 211.6, "r_y2": 439.94, "r_x3": 187.93, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.75, "r_y0": 448.73, "r_x1": 230.8, "r_y1": 448.73, "r_x2": 230.8, "r_y2": 439.94, "r_x3": 214.75, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.84, "r_y0": 448.73, "r_x1": 262.6, "r_y1": 448.73, "r_x2": 262.6, "r_y2": 439.94, "r_x3": 233.84, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.72, "r_y0": 448.73, "r_x1": 480.59, "r_y1": 448.73, "r_x2": 480.59, "r_y2": 439.94, "r_x3": 262.72, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 460.69, "r_x1": 480.59, "r_y1": 460.69, "r_x2": 480.59, "r_y2": 451.89, "r_x3": 134.77, "r_y3": 451.89, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 472.64, "r_x1": 480.59, "r_y1": 472.64, "r_x2": 480.59, "r_y2": 463.85, "r_x3": 134.77, "r_y3": 463.85, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 484.6, "r_x1": 480.59, "r_y1": 484.6, "r_x2": 480.59, "r_y2": 475.8, "r_x3": 134.77, "r_y3": 475.8, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 496.56, "r_x1": 480.59, "r_y1": 496.56, "r_x2": 480.59, "r_y2": 487.76, "r_x3": 134.77, "r_y3": 487.76, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 508.51, "r_x1": 480.59, "r_y1": 508.51, "r_x2": 480.59, "r_y2": 499.71, "r_x3": 134.77, "r_y3": 499.71, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 520.47, "r_x1": 480.59, "r_y1": 520.47, "r_x2": 480.59, "r_y2": 511.67, "r_x3": 134.77, "r_y3": 511.67, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 532.42, "r_x1": 176.93, "r_y1": 532.42, "r_x2": 176.93, "r_y2": 523.62, "r_x3": 134.77, "r_y3": 523.62, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 544.84, "r_x1": 480.59, "r_y1": 544.84, "r_x2": 480.59, "r_y2": 536.04, "r_x3": 149.71, "r_y3": 536.04, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 556.79, "r_x1": 480.59, "r_y1": 556.79, "r_x2": 480.59, "r_y2": 548.0, "r_x3": 134.77, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 568.75, "r_x1": 480.59, "r_y1": 568.75, "r_x2": 480.59, "r_y2": 559.95, "r_x3": 134.77, "r_y3": 559.95, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 580.71, "r_x1": 452.19, "r_y1": 580.71, "r_x2": 452.19, "r_y2": 571.91, "r_x3": 134.77, "r_y3": 571.91, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.33, "r_x3": 149.71, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.77, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.77, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.77, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.77, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 5, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.927, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 187.51, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 162.48, "r_y1": 139.69, "r_x2": 162.48, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.37, "r_y0": 139.69, "r_x1": 201.75, "r_y1": 139.69, "r_x2": 201.75, "r_y2": 130.89, "r_x3": 166.37, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.75, "r_y0": 139.69, "r_x1": 204.52, "r_y1": 139.69, "r_x2": 204.52, "r_y2": 130.89, "r_x3": 201.75, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.4, "r_y0": 139.69, "r_x1": 248.87, "r_y1": 139.69, "r_x2": 248.87, "r_y2": 130.89, "r_x3": 208.4, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.87, "r_y0": 139.69, "r_x1": 251.64, "r_y1": 139.69, "r_x2": 251.64, "r_y2": 130.89, "r_x3": 248.87, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.52, "r_y0": 139.69, "r_x1": 278.3, "r_y1": 139.69, "r_x2": 278.3, "r_y2": 130.89, "r_x3": 255.52, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.3, "r_y0": 139.69, "r_x1": 281.06, "r_y1": 139.69, "r_x2": 281.06, "r_y2": 130.89, "r_x3": 278.3, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.95, "r_y0": 139.69, "r_x1": 312.82, "r_y1": 139.69, "r_x2": 312.82, "r_y2": 130.89, "r_x3": 284.95, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 139.69, "r_x1": 315.58, "r_y1": 139.69, "r_x2": 315.58, "r_y2": 130.89, "r_x3": 312.82, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.47, "r_y0": 139.69, "r_x1": 343.14, "r_y1": 139.69, "r_x2": 343.14, "r_y2": 130.89, "r_x3": 319.47, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.13, "r_y0": 139.69, "r_x1": 363.18, "r_y1": 139.69, "r_x2": 363.18, "r_y2": 130.89, "r_x3": 347.13, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06, "r_y0": 139.69, "r_x1": 395.82, "r_y1": 139.69, "r_x2": 395.82, "r_y2": 130.89, "r_x3": 367.06, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.82, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 395.82, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.77, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 134.77, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.77, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 187.51, "r_x1": 261.93, "r_y1": 187.51, "r_x2": 261.93, "r_y2": 178.71, "r_x3": 134.77, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "caption", "bbox": { "l": 145.61, "t": 221.08, "r": 469.75, "b": 229.21, "coord_origin": "TOPLEFT" }, "confidence": 0.847, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.61, "r_y0": 229.01, "r_x1": 173.49, "r_y1": 229.01, "r_x2": 173.49, "r_y2": 221.08, "r_x3": 145.61, "r_y3": 221.08, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56, "r_y0": 229.21, "r_x1": 469.75, "r_y1": 229.21, "r_x2": 469.75, "r_y2": 221.14, "r_x3": 176.56, "r_y3": 221.14, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 368.21, "r": 480.59, "b": 532.42, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 377.0, "r_x1": 480.59, "r_y1": 377.0, "r_x2": 480.59, "r_y2": 368.21, "r_x3": 149.71, "r_y3": 368.21, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 388.96, "r_x1": 480.59, "r_y1": 388.96, "r_x2": 480.59, "r_y2": 380.16, "r_x3": 134.76, "r_y3": 380.16, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 400.91, "r_x1": 480.59, "r_y1": 400.91, "r_x2": 480.59, "r_y2": 392.12, "r_x3": 134.76, "r_y3": 392.12, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 412.87, "r_x1": 480.59, "r_y1": 412.87, "r_x2": 480.59, "r_y2": 404.07, "r_x3": 134.76, "r_y3": 404.07, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 424.82, "r_x1": 480.59, "r_y1": 424.82, "r_x2": 480.59, "r_y2": 416.03, "r_x3": 134.76, "r_y3": 416.03, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 436.78, "r_x1": 480.59, "r_y1": 436.78, "r_x2": 480.59, "r_y2": 427.98, "r_x3": 134.76, "r_y3": 427.98, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 448.73, "r_x1": 187.93, "r_y1": 448.73, "r_x2": 187.93, "r_y2": 439.94, "r_x3": 134.76, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.93, "r_y0": 448.73, "r_x1": 211.6, "r_y1": 448.73, "r_x2": 211.6, "r_y2": 439.94, "r_x3": 187.93, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.75, "r_y0": 448.73, "r_x1": 230.8, "r_y1": 448.73, "r_x2": 230.8, "r_y2": 439.94, "r_x3": 214.75, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.84, "r_y0": 448.73, "r_x1": 262.6, "r_y1": 448.73, "r_x2": 262.6, "r_y2": 439.94, "r_x3": 233.84, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.72, "r_y0": 448.73, "r_x1": 480.59, "r_y1": 448.73, "r_x2": 480.59, "r_y2": 439.94, "r_x3": 262.72, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 460.69, "r_x1": 480.59, "r_y1": 460.69, "r_x2": 480.59, "r_y2": 451.89, "r_x3": 134.77, "r_y3": 451.89, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 472.64, "r_x1": 480.59, "r_y1": 472.64, "r_x2": 480.59, "r_y2": 463.85, "r_x3": 134.77, "r_y3": 463.85, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 484.6, "r_x1": 480.59, "r_y1": 484.6, "r_x2": 480.59, "r_y2": 475.8, "r_x3": 134.77, "r_y3": 475.8, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 496.56, "r_x1": 480.59, "r_y1": 496.56, "r_x2": 480.59, "r_y2": 487.76, "r_x3": 134.77, "r_y3": 487.76, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 508.51, "r_x1": 480.59, "r_y1": 508.51, "r_x2": 480.59, "r_y2": 499.71, "r_x3": 134.77, "r_y3": 499.71, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 520.47, "r_x1": 480.59, "r_y1": 520.47, "r_x2": 480.59, "r_y2": 511.67, "r_x3": 134.77, "r_y3": 511.67, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 532.42, "r_x1": 176.93, "r_y1": 532.42, "r_x2": 176.93, "r_y2": 523.62, "r_x3": 134.77, "r_y3": 523.62, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.77, "t": 536.04, "r": 480.59, "b": 580.71, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 544.84, "r_x1": 480.59, "r_y1": 544.84, "r_x2": 480.59, "r_y2": 536.04, "r_x3": 149.71, "r_y3": 536.04, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 556.79, "r_x1": 480.59, "r_y1": 556.79, "r_x2": 480.59, "r_y2": 548.0, "r_x3": 134.77, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 568.75, "r_x1": 480.59, "r_y1": 568.75, "r_x2": 480.59, "r_y2": 559.95, "r_x3": 134.77, "r_y3": 559.95, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 580.71, "r_x1": 452.19, "r_y1": 580.71, "r_x2": 452.19, "r_y2": 571.91, "r_x3": 134.77, "r_y3": 571.91, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.77, "t": 584.33, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.33, "r_x3": 149.71, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.77, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.77, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.77, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.77, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "picture", "bbox": { "l": 137.41, "t": 233.51, "r": 476.56, "b": 340.23, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.927, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" }, { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 187.51, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 162.48, "r_y1": 139.69, "r_x2": 162.48, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.37, "r_y0": 139.69, "r_x1": 201.75, "r_y1": 139.69, "r_x2": 201.75, "r_y2": 130.89, "r_x3": 166.37, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.75, "r_y0": 139.69, "r_x1": 204.52, "r_y1": 139.69, "r_x2": 204.52, "r_y2": 130.89, "r_x3": 201.75, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.4, "r_y0": 139.69, "r_x1": 248.87, "r_y1": 139.69, "r_x2": 248.87, "r_y2": 130.89, "r_x3": 208.4, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.87, "r_y0": 139.69, "r_x1": 251.64, "r_y1": 139.69, "r_x2": 251.64, "r_y2": 130.89, "r_x3": 248.87, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.52, "r_y0": 139.69, "r_x1": 278.3, "r_y1": 139.69, "r_x2": 278.3, "r_y2": 130.89, "r_x3": 255.52, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.3, "r_y0": 139.69, "r_x1": 281.06, "r_y1": 139.69, "r_x2": 281.06, "r_y2": 130.89, "r_x3": 278.3, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.95, "r_y0": 139.69, "r_x1": 312.82, "r_y1": 139.69, "r_x2": 312.82, "r_y2": 130.89, "r_x3": 284.95, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 139.69, "r_x1": 315.58, "r_y1": 139.69, "r_x2": 315.58, "r_y2": 130.89, "r_x3": 312.82, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.47, "r_y0": 139.69, "r_x1": 343.14, "r_y1": 139.69, "r_x2": 343.14, "r_y2": 130.89, "r_x3": 319.47, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.13, "r_y0": 139.69, "r_x1": 363.18, "r_y1": 139.69, "r_x2": 363.18, "r_y2": 130.89, "r_x3": 347.13, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06, "r_y0": 139.69, "r_x1": 395.82, "r_y1": 139.69, "r_x2": 395.82, "r_y2": 130.89, "r_x3": 367.06, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.82, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 395.82, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.77, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 134.77, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.77, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 187.51, "r_x1": 261.93, "r_y1": 187.51, "r_x2": 261.93, "r_y2": 178.71, "r_x3": 134.77, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML tokens ,
, , , and , one can construct simple table structures without any spanning cells. In reality though, one needs at least 28 HTML tokens to describe the most common complex tables observed in real-world documents [21,22], due to a variety of spanning cells definitions in the HTML token vocabulary." }, { "label": "caption", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 145.61, "t": 221.08, "r": 469.75, "b": 229.21, "coord_origin": "TOPLEFT" }, "confidence": 0.847, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.61, "r_y0": 229.01, "r_x1": 173.49, "r_y1": 229.01, "r_x2": 173.49, "r_y2": 221.08, "r_x3": 145.61, "r_y3": 221.08, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56, "r_y0": 229.21, "r_x1": 469.75, "r_y1": 229.21, "r_x2": 469.75, "r_y2": 221.14, "r_x3": 176.56, "r_y3": 221.14, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 2. Frequency of tokens in HTML and OTSL as they appear in PubTabNet." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 368.21, "r": 480.59, "b": 532.42, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 377.0, "r_x1": 480.59, "r_y1": 377.0, "r_x2": 480.59, "r_y2": 368.21, "r_x3": 149.71, "r_y3": 368.21, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 388.96, "r_x1": 480.59, "r_y1": 388.96, "r_x2": 480.59, "r_y2": 380.16, "r_x3": 134.76, "r_y3": 380.16, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 400.91, "r_x1": 480.59, "r_y1": 400.91, "r_x2": 480.59, "r_y2": 392.12, "r_x3": 134.76, "r_y3": 392.12, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 412.87, "r_x1": 480.59, "r_y1": 412.87, "r_x2": 480.59, "r_y2": 404.07, "r_x3": 134.76, "r_y3": 404.07, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 424.82, "r_x1": 480.59, "r_y1": 424.82, "r_x2": 480.59, "r_y2": 416.03, "r_x3": 134.76, "r_y3": 416.03, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 436.78, "r_x1": 480.59, "r_y1": 436.78, "r_x2": 480.59, "r_y2": 427.98, "r_x3": 134.76, "r_y3": 427.98, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 448.73, "r_x1": 187.93, "r_y1": 448.73, "r_x2": 187.93, "r_y2": 439.94, "r_x3": 134.76, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.93, "r_y0": 448.73, "r_x1": 211.6, "r_y1": 448.73, "r_x2": 211.6, "r_y2": 439.94, "r_x3": 187.93, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.75, "r_y0": 448.73, "r_x1": 230.8, "r_y1": 448.73, "r_x2": 230.8, "r_y2": 439.94, "r_x3": 214.75, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.84, "r_y0": 448.73, "r_x1": 262.6, "r_y1": 448.73, "r_x2": 262.6, "r_y2": 439.94, "r_x3": 233.84, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.72, "r_y0": 448.73, "r_x1": 480.59, "r_y1": 448.73, "r_x2": 480.59, "r_y2": 439.94, "r_x3": 262.72, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 460.69, "r_x1": 480.59, "r_y1": 460.69, "r_x2": 480.59, "r_y2": 451.89, "r_x3": 134.77, "r_y3": 451.89, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 472.64, "r_x1": 480.59, "r_y1": 472.64, "r_x2": 480.59, "r_y2": 463.85, "r_x3": 134.77, "r_y3": 463.85, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 484.6, "r_x1": 480.59, "r_y1": 484.6, "r_x2": 480.59, "r_y2": 475.8, "r_x3": 134.77, "r_y3": 475.8, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 496.56, "r_x1": 480.59, "r_y1": 496.56, "r_x2": 480.59, "r_y2": 487.76, "r_x3": 134.77, "r_y3": 487.76, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 508.51, "r_x1": 480.59, "r_y1": 508.51, "r_x2": 480.59, "r_y2": 499.71, "r_x3": 134.77, "r_y3": 499.71, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 520.47, "r_x1": 480.59, "r_y1": 520.47, "r_x2": 480.59, "r_y2": 511.67, "r_x3": 134.77, "r_y3": 511.67, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 532.42, "r_x1": 176.93, "r_y1": 532.42, "r_x2": 176.93, "r_y2": 523.62, "r_x3": 134.77, "r_y3": 523.62, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Obviously, HTML and other general-purpose markup languages were not designed for Im2Seq models. As such, they have some serious drawbacks. First, the token vocabulary needs to be artificially large in order to describe all plausible tabular structures. Since most Im2Seq models use an autoregressive approach, they generate the sequence token by token. Therefore, to reduce inference time, a shorter sequence length is critical. Every table-cell is represented by at least two tokens ( and ). Furthermore, when tokenizing the HTML structure, one needs to explicitly enumerate possible column-spans and row-spans as words. In practice, this ends up requiring 28 different HTML tokens (when including column- and row-spans up to 10 cells) just to describe every table in the PubTabNet dataset. Clearly, not every token is equally represented, as is depicted in Figure 2. This skewed distribution of tokens in combination with variable token row-length makes it challenging for models to learn the HTML structure." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.77, "t": 536.04, "r": 480.59, "b": 580.71, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 544.84, "r_x1": 480.59, "r_y1": 544.84, "r_x2": 480.59, "r_y2": 536.04, "r_x3": 149.71, "r_y3": 536.04, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 556.79, "r_x1": 480.59, "r_y1": 556.79, "r_x2": 480.59, "r_y2": 548.0, "r_x3": 134.77, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 568.75, "r_x1": 480.59, "r_y1": 568.75, "r_x2": 480.59, "r_y2": 559.95, "r_x3": 134.77, "r_y3": 559.95, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 580.71, "r_x1": 452.19, "r_y1": 580.71, "r_x2": 452.19, "r_y2": 571.91, "r_x3": 134.77, "r_y3": 571.91, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, it would be desirable if the representation would easily allow an early detection of invalid sequences on-the-go, before the prediction of the entire table structure is completed. HTML is not well-suited for this purpose as the verification of incomplete sequences is non-trivial or even impossible." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.77, "t": 584.33, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.33, "r_x3": 149.71, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.77, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.77, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.77, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.77, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table cells, serialised in row-major ordering, where each row and each column have the same length (while considering row- and column-spans). Furthermore, every opening tag in HTML needs to be matched by a closing tag in a correct hierarchical manner. Since the number of tokens for each table row and column can vary significantly, especially for large tables with many row- and column-spans, it is complex to verify the consistency of predicted structures during sequence" }, { "label": "picture", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "picture", "bbox": { "l": 137.41, "t": 233.51, "r": 476.56, "b": 340.23, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "text", "id": 0, "page_no": 4, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 187.51, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML", "orig": "ulary and can be interpreted as a table structure. For example, with the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 162.48, "r_y1": 139.69, "r_x2": 162.48, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.37, "r_y0": 139.69, "r_x1": 201.75, "r_y1": 139.69, "r_x2": 201.75, "r_y2": 130.89, "r_x3": 166.37, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 201.75, "r_y0": 139.69, "r_x1": 204.52, "r_y1": 139.69, "r_x2": 204.52, "r_y2": 130.89, "r_x3": 201.75, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 208.4, "r_y0": 139.69, "r_x1": 248.87, "r_y1": 139.69, "r_x2": 248.87, "r_y2": 130.89, "r_x3": 208.4, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.87, "r_y0": 139.69, "r_x1": 251.64, "r_y1": 139.69, "r_x2": 251.64, "r_y2": 130.89, "r_x3": 248.87, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 255.52, "r_y0": 139.69, "r_x1": 278.3, "r_y1": 139.69, "r_x2": 278.3, "r_y2": 130.89, "r_x3": 255.52, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 278.3, "r_y0": 139.69, "r_x1": 281.06, "r_y1": 139.69, "r_x2": 281.06, "r_y2": 130.89, "r_x3": 278.3, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 284.95, "r_y0": 139.69, "r_x1": 312.82, "r_y1": 139.69, "r_x2": 312.82, "r_y2": 130.89, "r_x3": 284.95, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.82, "r_y0": 139.69, "r_x1": 315.58, "r_y1": 139.69, "r_x2": 315.58, "r_y2": 130.89, "r_x3": 312.82, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 319.47, "r_y0": 139.69, "r_x1": 343.14, "r_y1": 139.69, "r_x2": 343.14, "r_y2": 130.89, "r_x3": 319.47, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.13, "r_y0": 139.69, "r_x1": 363.18, "r_y1": 139.69, "r_x2": 363.18, "r_y2": 130.89, "r_x3": 347.13, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.06, "r_y0": 139.69, "r_x1": 395.82, "r_y1": 139.69, "r_x2": 395.82, "r_y2": 130.89, "r_x3": 367.06, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.82, "r_y0": 139.69, "r_x1": 480.59, "r_y1": 139.69, "r_x2": 480.59, "r_y2": 130.89, "r_x3": 395.82, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": ", one can construct", "orig": ", one can construct", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 151.64, "r_x1": 480.59, "r_y1": 151.64, "r_x2": 480.59, "r_y2": 142.84, "r_x3": 134.77, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "simple table structures without any spanning cells. In reality though, one needs", "orig": "simple table structures without any spanning cells. In reality though, one needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 163.6, "r_x1": 480.59, "r_y1": 163.6, "r_x2": 480.59, "r_y2": 154.8, "r_x3": 134.77, "r_y3": 154.8, "coord_origin": "TOPLEFT" }, "text": "at least 28 HTML tokens to describe the most common complex tables observed", "orig": "at least 28 HTML tokens to describe the most common complex tables observed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 175.55, "r_x1": 480.59, "r_y1": 175.55, "r_x2": 480.59, "r_y2": 166.75, "r_x3": 134.77, "r_y3": 166.75, "coord_origin": "TOPLEFT" }, "text": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "orig": "in real-world documents [21,22], due to a variety of spanning cells definitions in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 187.51, "r_x1": 261.93, "r_y1": 187.51, "r_x2": 261.93, "r_y2": 178.71, "r_x3": 134.77, "r_y3": 178.71, "coord_origin": "TOPLEFT" }, "text": "the HTML token vocabulary.", "orig": "the HTML token vocabulary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "ulary and can be interpreted as a table structure. For example, with the HTML tokens ,
, , , and , one can construct simple table structures without any spanning cells. In reality though, one needs at least 28 HTML tokens to describe the most common complex tables observed in real-world documents [21,22], due to a variety of spanning cells definitions in the HTML token vocabulary." }, { "label": "caption", "id": 7, "page_no": 4, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 145.61, "t": 221.08, "r": 469.75, "b": 229.21, "coord_origin": "TOPLEFT" }, "confidence": 0.847, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 145.61, "r_y0": 229.01, "r_x1": 173.49, "r_y1": 229.01, "r_x2": 173.49, "r_y2": 221.08, "r_x3": 145.61, "r_y3": 221.08, "coord_origin": "TOPLEFT" }, "text": "Fig. 2.", "orig": "Fig. 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.56, "r_y0": 229.21, "r_x1": 469.75, "r_y1": 229.21, "r_x2": 469.75, "r_y2": 221.14, "r_x3": 176.56, "r_y3": 221.14, "coord_origin": "TOPLEFT" }, "text": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "orig": "Frequency of tokens in HTML and OTSL as they appear in PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 2. Frequency of tokens in HTML and OTSL as they appear in PubTabNet." }, { "label": "text", "id": 1, "page_no": 4, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 368.21, "r": 480.59, "b": 532.42, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 377.0, "r_x1": 480.59, "r_y1": 377.0, "r_x2": 480.59, "r_y2": 368.21, "r_x3": 149.71, "r_y3": 368.21, "coord_origin": "TOPLEFT" }, "text": "Obviously, HTML and other general-purpose markup languages were not de-", "orig": "Obviously, HTML and other general-purpose markup languages were not de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 388.96, "r_x1": 480.59, "r_y1": 388.96, "r_x2": 480.59, "r_y2": 380.16, "r_x3": 134.76, "r_y3": 380.16, "coord_origin": "TOPLEFT" }, "text": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "orig": "signed for Im2Seq models. As such, they have some serious drawbacks. First, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 400.91, "r_x1": 480.59, "r_y1": 400.91, "r_x2": 480.59, "r_y2": 392.12, "r_x3": 134.76, "r_y3": 392.12, "coord_origin": "TOPLEFT" }, "text": "token vocabulary needs to be artificially large in order to describe all plausible", "orig": "token vocabulary needs to be artificially large in order to describe all plausible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 412.87, "r_x1": 480.59, "r_y1": 412.87, "r_x2": 480.59, "r_y2": 404.07, "r_x3": 134.76, "r_y3": 404.07, "coord_origin": "TOPLEFT" }, "text": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "orig": "tabular structures. Since most Im2Seq models use an autoregressive approach,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 424.82, "r_x1": 480.59, "r_y1": 424.82, "r_x2": 480.59, "r_y2": 416.03, "r_x3": 134.76, "r_y3": 416.03, "coord_origin": "TOPLEFT" }, "text": "they generate the sequence token by token. Therefore, to reduce inference time,", "orig": "they generate the sequence token by token. Therefore, to reduce inference time,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 436.78, "r_x1": 480.59, "r_y1": 436.78, "r_x2": 480.59, "r_y2": 427.98, "r_x3": 134.76, "r_y3": 427.98, "coord_origin": "TOPLEFT" }, "text": "a shorter sequence length is critical. Every table-cell is represented by at least", "orig": "a shorter sequence length is critical. Every table-cell is represented by at least", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 448.73, "r_x1": 187.93, "r_y1": 448.73, "r_x2": 187.93, "r_y2": 439.94, "r_x3": 134.76, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "two tokens (", "orig": "two tokens (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.93, "r_y0": 448.73, "r_x1": 211.6, "r_y1": 448.73, "r_x2": 211.6, "r_y2": 439.94, "r_x3": 187.93, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 214.75, "r_y0": 448.73, "r_x1": 230.8, "r_y1": 448.73, "r_x2": 230.8, "r_y2": 439.94, "r_x3": 214.75, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 233.84, "r_y0": 448.73, "r_x1": 262.6, "r_y1": 448.73, "r_x2": 262.6, "r_y2": 439.94, "r_x3": 233.84, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.72, "r_y0": 448.73, "r_x1": 480.59, "r_y1": 448.73, "r_x2": 480.59, "r_y2": 439.94, "r_x3": 262.72, "r_y3": 439.94, "coord_origin": "TOPLEFT" }, "text": "). Furthermore, when tokenizing the HTML struc-", "orig": "). Furthermore, when tokenizing the HTML struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 460.69, "r_x1": 480.59, "r_y1": 460.69, "r_x2": 480.59, "r_y2": 451.89, "r_x3": 134.77, "r_y3": 451.89, "coord_origin": "TOPLEFT" }, "text": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "orig": "ture, one needs to explicitly enumerate possible column-spans and row-spans", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 472.64, "r_x1": 480.59, "r_y1": 472.64, "r_x2": 480.59, "r_y2": 463.85, "r_x3": 134.77, "r_y3": 463.85, "coord_origin": "TOPLEFT" }, "text": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "orig": "as words. In practice, this ends up requiring 28 different HTML tokens (when", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 484.6, "r_x1": 480.59, "r_y1": 484.6, "r_x2": 480.59, "r_y2": 475.8, "r_x3": 134.77, "r_y3": 475.8, "coord_origin": "TOPLEFT" }, "text": "including column- and row-spans up to 10 cells) just to describe every table in", "orig": "including column- and row-spans up to 10 cells) just to describe every table in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 496.56, "r_x1": 480.59, "r_y1": 496.56, "r_x2": 480.59, "r_y2": 487.76, "r_x3": 134.77, "r_y3": 487.76, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "orig": "the PubTabNet dataset. Clearly, not every token is equally represented, as is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 508.51, "r_x1": 480.59, "r_y1": 508.51, "r_x2": 480.59, "r_y2": 499.71, "r_x3": 134.77, "r_y3": 499.71, "coord_origin": "TOPLEFT" }, "text": "depicted in Figure 2. This skewed distribution of tokens in combination with", "orig": "depicted in Figure 2. This skewed distribution of tokens in combination with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 520.47, "r_x1": 480.59, "r_y1": 520.47, "r_x2": 480.59, "r_y2": 511.67, "r_x3": 134.77, "r_y3": 511.67, "coord_origin": "TOPLEFT" }, "text": "variable token row-length makes it challenging for models to learn the HTML", "orig": "variable token row-length makes it challenging for models to learn the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 532.42, "r_x1": 176.93, "r_y1": 532.42, "r_x2": 176.93, "r_y2": 523.62, "r_x3": 134.77, "r_y3": 523.62, "coord_origin": "TOPLEFT" }, "text": "structure.", "orig": "structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Obviously, HTML and other general-purpose markup languages were not designed for Im2Seq models. As such, they have some serious drawbacks. First, the token vocabulary needs to be artificially large in order to describe all plausible tabular structures. Since most Im2Seq models use an autoregressive approach, they generate the sequence token by token. Therefore, to reduce inference time, a shorter sequence length is critical. Every table-cell is represented by at least two tokens ( and ). Furthermore, when tokenizing the HTML structure, one needs to explicitly enumerate possible column-spans and row-spans as words. In practice, this ends up requiring 28 different HTML tokens (when including column- and row-spans up to 10 cells) just to describe every table in the PubTabNet dataset. Clearly, not every token is equally represented, as is depicted in Figure 2. This skewed distribution of tokens in combination with variable token row-length makes it challenging for models to learn the HTML structure." }, { "label": "text", "id": 3, "page_no": 4, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.77, "t": 536.04, "r": 480.59, "b": 580.71, "coord_origin": "TOPLEFT" }, "confidence": 0.978, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 544.84, "r_x1": 480.59, "r_y1": 544.84, "r_x2": 480.59, "r_y2": 536.04, "r_x3": 149.71, "r_y3": 536.04, "coord_origin": "TOPLEFT" }, "text": "Additionally, it would be desirable if the representation would easily allow", "orig": "Additionally, it would be desirable if the representation would easily allow", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 556.79, "r_x1": 480.59, "r_y1": 556.79, "r_x2": 480.59, "r_y2": 548.0, "r_x3": 134.77, "r_y3": 548.0, "coord_origin": "TOPLEFT" }, "text": "an early detection of invalid sequences on-the-go, before the prediction of the", "orig": "an early detection of invalid sequences on-the-go, before the prediction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 568.75, "r_x1": 480.59, "r_y1": 568.75, "r_x2": 480.59, "r_y2": 559.95, "r_x3": 134.77, "r_y3": 559.95, "coord_origin": "TOPLEFT" }, "text": "entire table structure is completed. HTML is not well-suited for this purpose as", "orig": "entire table structure is completed. HTML is not well-suited for this purpose as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 580.71, "r_x1": 452.19, "r_y1": 580.71, "r_x2": 452.19, "r_y2": 571.91, "r_x3": 134.77, "r_y3": 571.91, "coord_origin": "TOPLEFT" }, "text": "the verification of incomplete sequences is non-trivial or even impossible.", "orig": "the verification of incomplete sequences is non-trivial or even impossible.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, it would be desirable if the representation would easily allow an early detection of invalid sequences on-the-go, before the prediction of the entire table structure is completed. HTML is not well-suited for this purpose as the verification of incomplete sequences is non-trivial or even impossible." }, { "label": "text", "id": 2, "page_no": 4, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.77, "t": 584.33, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.33, "r_x3": 149.71, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table", "orig": "In a valid HTML table, the token sequence must describe a 2D grid of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.77, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "cells, serialised in row-major ordering, where each row and each column have", "orig": "cells, serialised in row-major ordering, where each row and each column have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.24, "r_x3": 134.77, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "the same length (while considering row- and column-spans). Furthermore, every", "orig": "the same length (while considering row- and column-spans). Furthermore, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.77, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "orig": "opening tag in HTML needs to be matched by a closing tag in a correct hierar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.77, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "chical manner. Since the number of tokens for each table row and column can", "orig": "chical manner. Since the number of tokens for each table row and column can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.77, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "vary significantly, especially for large tables with many row- and column-spans,", "orig": "vary significantly, especially for large tables with many row- and column-spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "it is complex to verify the consistency of predicted structures during sequence", "orig": "it is complex to verify the consistency of predicted structures during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In a valid HTML table, the token sequence must describe a 2D grid of table cells, serialised in row-major ordering, where each row and each column have the same length (while considering row- and column-spans). Furthermore, every opening tag in HTML needs to be matched by a closing tag in a correct hierarchical manner. Since the number of tokens for each table row and column can vary significantly, especially for large tables with many row- and column-spans, it is complex to verify the consistency of predicted structures during sequence" }, { "label": "picture", "id": 4, "page_no": 4, "cluster": { "id": 4, "label": "picture", "bbox": { "l": 137.41, "t": 233.51, "r": 476.56, "b": 340.23, "coord_origin": "TOPLEFT" }, "confidence": 0.939, "cells": [], "children": [] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_header", "id": 5, "page_no": 4, "cluster": { "id": 5, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.927, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 6, "page_no": 4, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.87, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5" } ] } }, { "page_no": 5, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 364.63, "r_y1": 139.69, "r_x2": 364.63, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 152.28, "r_x1": 480.59, "r_y1": 152.28, "r_x2": 480.59, "r_y2": 143.48, "r_x3": 149.71, "r_y3": 143.48, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 164.23, "r_x1": 480.59, "r_y1": 164.23, "r_x2": 480.59, "r_y2": 155.44, "r_x3": 134.76, "r_y3": 155.44, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 176.19, "r_x1": 480.59, "r_y1": 176.19, "r_x2": 480.59, "r_y2": 167.39, "r_x3": 134.76, "r_y3": 167.39, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 188.14, "r_x1": 480.59, "r_y1": 188.14, "r_x2": 480.59, "r_y2": 179.35, "r_x3": 134.76, "r_y3": 179.35, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 200.1, "r_x1": 314.28, "r_y1": 200.1, "r_x2": 314.28, "r_y2": 191.3, "r_x3": 134.76, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.06, "r_y0": 200.1, "r_x1": 374.09, "r_y1": 200.1, "r_x2": 374.09, "r_y2": 191.3, "r_x3": 318.06, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.81, "r_y0": 200.1, "r_x1": 480.59, "r_y1": 200.1, "r_x2": 480.59, "r_y2": 191.3, "r_x3": 378.81, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 212.06, "r_x1": 480.59, "r_y1": 212.06, "r_x2": 480.59, "r_y2": 203.26, "r_x3": 134.76, "r_y3": 203.26, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 224.01, "r_x1": 480.6, "r_y1": 224.01, "r_x2": 480.6, "r_y2": 215.21, "r_x3": 134.76, "r_y3": 215.21, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.97, "r_x1": 480.59, "r_y1": 235.97, "r_x2": 480.59, "r_y2": 227.17, "r_x3": 134.76, "r_y3": 227.17, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.92, "r_x1": 480.59, "r_y1": 247.92, "r_x2": 480.59, "r_y2": 239.12, "r_x3": 134.76, "r_y3": 239.12, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.88, "r_x1": 480.59, "r_y1": 259.88, "r_x2": 480.59, "r_y2": 251.08, "r_x3": 134.76, "r_y3": 251.08, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 271.83, "r_x1": 480.59, "r_y1": 271.83, "r_x2": 480.59, "r_y2": 263.03, "r_x3": 134.76, "r_y3": 263.03, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.79, "r_x1": 480.59, "r_y1": 283.79, "r_x2": 480.59, "r_y2": 274.99, "r_x3": 134.76, "r_y3": 274.99, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.74, "r_x1": 223.57, "r_y1": 295.74, "r_x2": 223.57, "r_y2": 286.94, "r_x3": 134.76, "r_y3": 286.94, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.2, "r_x1": 141.49, "r_y1": 331.2, "r_x2": 141.49, "r_y2": 320.63, "r_x3": 134.76, "r_y3": 320.63, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 331.2, "r_x1": 372.51, "r_y1": 331.2, "r_x2": 372.51, "r_y2": 320.63, "r_x3": 154.94, "r_y3": 320.63, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 357.91, "r_x1": 480.59, "r_y1": 357.91, "r_x2": 480.59, "r_y2": 349.12, "r_x3": 134.76, "r_y3": 349.12, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 369.87, "r_x1": 480.59, "r_y1": 369.87, "r_x2": 480.59, "r_y2": 361.07, "r_x3": 134.76, "r_y3": 361.07, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 381.82, "r_x1": 480.59, "r_y1": 381.82, "r_x2": 480.59, "r_y2": 373.03, "r_x3": 134.76, "r_y3": 373.03, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 393.78, "r_x1": 480.59, "r_y1": 393.78, "r_x2": 480.59, "r_y2": 384.98, "r_x3": 134.76, "r_y3": 384.98, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 405.73, "r_x1": 480.59, "r_y1": 405.73, "r_x2": 480.59, "r_y2": 396.94, "r_x3": 134.76, "r_y3": 396.94, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 417.69, "r_x1": 480.59, "r_y1": 417.69, "r_x2": 480.59, "r_y2": 408.89, "r_x3": 134.76, "r_y3": 408.89, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 429.64, "r_x1": 480.59, "r_y1": 429.64, "r_x2": 480.59, "r_y2": 420.85, "r_x3": 134.76, "r_y3": 420.85, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 441.6, "r_x1": 276.67, "r_y1": 441.6, "r_x2": 276.67, "r_y2": 432.8, "r_x3": 134.76, "r_y3": 432.8, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 474.68, "r_x1": 149.4, "r_y1": 474.68, "r_x2": 149.4, "r_y2": 465.87, "r_x3": 134.76, "r_y3": 465.87, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 474.68, "r_x1": 261.8, "r_y1": 474.68, "r_x2": 261.8, "r_y2": 465.87, "r_x3": 160.86, "r_y3": 465.87, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 497.79, "r_x1": 480.59, "r_y1": 497.79, "r_x2": 480.59, "r_y2": 489.0, "r_x3": 134.76, "r_y3": 489.0, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 509.75, "r_x1": 480.59, "r_y1": 509.75, "r_x2": 480.59, "r_y2": 500.95, "r_x3": 134.76, "r_y3": 500.95, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 521.71, "r_x1": 154.71, "r_y1": 521.71, "r_x2": 154.71, "r_y2": 512.91, "r_x3": 134.76, "r_y3": 512.91, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 534.3, "r_x1": 409.31, "r_y1": 534.3, "r_x2": 409.31, "r_y2": 525.5, "r_x3": 149.71, "r_y3": 525.5, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 556.78, "r_x1": 146.72, "r_y1": 556.78, "r_x2": 146.72, "r_y2": 547.97, "r_x3": 140.99, "r_y3": 547.97, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 556.78, "r_x1": 193.21, "r_y1": 556.78, "r_x2": 193.21, "r_y2": 547.98, "r_x3": 151.7, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.52, "r_y0": 556.78, "r_x1": 263.47, "r_y1": 556.78, "r_x2": 263.47, "r_y2": 547.98, "r_x3": 196.52, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.81, "r_y0": 556.78, "r_x1": 460.54, "r_y1": 556.78, "r_x2": 460.54, "r_y2": 547.98, "r_x3": 267.81, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 569.37, "r_x1": 146.72, "r_y1": 569.37, "r_x2": 146.72, "r_y2": 560.56, "r_x3": 140.99, "r_y3": 560.56, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 569.37, "r_x1": 194.3, "r_y1": 569.37, "r_x2": 194.3, "r_y2": 560.57, "r_x3": 151.7, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.66, "r_y0": 569.37, "r_x1": 264.52, "r_y1": 569.37, "r_x2": 264.52, "r_y2": 560.57, "r_x3": 198.66, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.52, "r_y0": 569.37, "r_x1": 480.59, "r_y1": 569.37, "r_x2": 480.59, "r_y2": 560.57, "r_x3": 264.52, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 581.32, "r_x1": 171.68, "r_y1": 581.32, "r_x2": 171.68, "r_y2": 572.53, "r_x3": 151.7, "r_y3": 572.53, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 593.92, "r_x1": 146.72, "r_y1": 593.92, "r_x2": 146.72, "r_y2": 585.11, "r_x3": 140.99, "r_y3": 585.11, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 593.92, "r_x1": 194.11, "r_y1": 593.92, "r_x2": 194.11, "r_y2": 585.12, "r_x3": 151.7, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.75, "r_y0": 593.92, "r_x1": 259.89, "r_y1": 593.92, "r_x2": 259.89, "r_y2": 585.12, "r_x3": 197.75, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.89, "r_y0": 593.92, "r_x1": 480.59, "r_y1": 593.92, "r_x2": 480.59, "r_y2": 585.12, "r_x3": 259.89, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 605.87, "r_x1": 171.68, "r_y1": 605.87, "r_x2": 171.68, "r_y2": 597.08, "r_x3": 151.7, "r_y3": 597.08, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 618.47, "r_x1": 146.72, "r_y1": 618.47, "r_x2": 146.72, "r_y2": 609.66, "r_x3": 140.99, "r_y3": 609.66, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 618.47, "r_x1": 193.48, "r_y1": 618.47, "r_x2": 193.48, "r_y2": 609.67, "r_x3": 151.7, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.8, "r_y0": 618.47, "r_x1": 236.12, "r_y1": 618.47, "r_x2": 236.12, "r_y2": 609.67, "r_x3": 196.8, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.13, "r_y0": 618.47, "r_x1": 454.55, "r_y1": 618.47, "r_x2": 454.55, "r_y2": 609.67, "r_x3": 236.13, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 631.06, "r_x1": 146.72, "r_y1": 631.06, "r_x2": 146.72, "r_y2": 622.25, "r_x3": 140.99, "r_y3": 622.25, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 631.06, "r_x1": 181.99, "r_y1": 631.06, "r_x2": 181.99, "r_y2": 622.26, "r_x3": 151.7, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.32, "r_y0": 631.06, "r_x1": 221.46, "r_y1": 631.06, "r_x2": 221.46, "r_y2": 622.26, "r_x3": 185.32, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 631.06, "r_x1": 328.62, "r_y1": 631.06, "r_x2": 328.62, "r_y2": 622.26, "r_x3": 221.46, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 149.71, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 228.22, "r_y1": 664.85, "r_x2": 228.22, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 14, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 139.69, "coord_origin": "TOPLEFT" }, "confidence": 0.963, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 364.63, "r_y1": 139.69, "r_x2": 364.63, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 143.48, "r": 480.6, "b": 295.74, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 152.28, "r_x1": 480.59, "r_y1": 152.28, "r_x2": 480.59, "r_y2": 143.48, "r_x3": 149.71, "r_y3": 143.48, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 164.23, "r_x1": 480.59, "r_y1": 164.23, "r_x2": 480.59, "r_y2": 155.44, "r_x3": 134.76, "r_y3": 155.44, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 176.19, "r_x1": 480.59, "r_y1": 176.19, "r_x2": 480.59, "r_y2": 167.39, "r_x3": 134.76, "r_y3": 167.39, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 188.14, "r_x1": 480.59, "r_y1": 188.14, "r_x2": 480.59, "r_y2": 179.35, "r_x3": 134.76, "r_y3": 179.35, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 200.1, "r_x1": 314.28, "r_y1": 200.1, "r_x2": 314.28, "r_y2": 191.3, "r_x3": 134.76, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.06, "r_y0": 200.1, "r_x1": 374.09, "r_y1": 200.1, "r_x2": 374.09, "r_y2": 191.3, "r_x3": 318.06, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.81, "r_y0": 200.1, "r_x1": 480.59, "r_y1": 200.1, "r_x2": 480.59, "r_y2": 191.3, "r_x3": 378.81, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 212.06, "r_x1": 480.59, "r_y1": 212.06, "r_x2": 480.59, "r_y2": 203.26, "r_x3": 134.76, "r_y3": 203.26, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 224.01, "r_x1": 480.6, "r_y1": 224.01, "r_x2": 480.6, "r_y2": 215.21, "r_x3": 134.76, "r_y3": 215.21, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.97, "r_x1": 480.59, "r_y1": 235.97, "r_x2": 480.59, "r_y2": 227.17, "r_x3": 134.76, "r_y3": 227.17, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.92, "r_x1": 480.59, "r_y1": 247.92, "r_x2": 480.59, "r_y2": 239.12, "r_x3": 134.76, "r_y3": 239.12, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.88, "r_x1": 480.59, "r_y1": 259.88, "r_x2": 480.59, "r_y2": 251.08, "r_x3": 134.76, "r_y3": 251.08, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 271.83, "r_x1": 480.59, "r_y1": 271.83, "r_x2": 480.59, "r_y2": 263.03, "r_x3": 134.76, "r_y3": 263.03, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.79, "r_x1": 480.59, "r_y1": 283.79, "r_x2": 480.59, "r_y2": 274.99, "r_x3": 134.76, "r_y3": 274.99, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.74, "r_x1": 223.57, "r_y1": 295.74, "r_x2": 223.57, "r_y2": 286.94, "r_x3": 134.76, "r_y3": 286.94, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "section_header", "bbox": { "l": 134.76, "t": 320.63, "r": 372.51, "b": 331.2, "coord_origin": "TOPLEFT" }, "confidence": 0.957, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.2, "r_x1": 141.49, "r_y1": 331.2, "r_x2": 141.49, "r_y2": 320.63, "r_x3": 134.76, "r_y3": 320.63, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 331.2, "r_x1": 372.51, "r_y1": 331.2, "r_x2": 372.51, "r_y2": 320.63, "r_x3": 154.94, "r_y3": 320.63, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 349.12, "r": 480.59, "b": 441.6, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 357.91, "r_x1": 480.59, "r_y1": 357.91, "r_x2": 480.59, "r_y2": 349.12, "r_x3": 134.76, "r_y3": 349.12, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 369.87, "r_x1": 480.59, "r_y1": 369.87, "r_x2": 480.59, "r_y2": 361.07, "r_x3": 134.76, "r_y3": 361.07, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 381.82, "r_x1": 480.59, "r_y1": 381.82, "r_x2": 480.59, "r_y2": 373.03, "r_x3": 134.76, "r_y3": 373.03, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 393.78, "r_x1": 480.59, "r_y1": 393.78, "r_x2": 480.59, "r_y2": 384.98, "r_x3": 134.76, "r_y3": 384.98, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 405.73, "r_x1": 480.59, "r_y1": 405.73, "r_x2": 480.59, "r_y2": 396.94, "r_x3": 134.76, "r_y3": 396.94, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 417.69, "r_x1": 480.59, "r_y1": 417.69, "r_x2": 480.59, "r_y2": 408.89, "r_x3": 134.76, "r_y3": 408.89, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 429.64, "r_x1": 480.59, "r_y1": 429.64, "r_x2": 480.59, "r_y2": 420.85, "r_x3": 134.76, "r_y3": 420.85, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 441.6, "r_x1": 276.67, "r_y1": 441.6, "r_x2": 276.67, "r_y2": 432.8, "r_x3": 134.76, "r_y3": 432.8, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "section_header", "bbox": { "l": 134.76, "t": 465.87, "r": 261.8, "b": 474.68, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 474.68, "r_x1": 149.4, "r_y1": 474.68, "r_x2": 149.4, "r_y2": 465.87, "r_x3": 134.76, "r_y3": 465.87, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 474.68, "r_x1": 261.8, "r_y1": 474.68, "r_x2": 261.8, "r_y2": 465.87, "r_x3": 160.86, "r_y3": 465.87, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 489.0, "r": 480.59, "b": 521.71, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 497.79, "r_x1": 480.59, "r_y1": 497.79, "r_x2": 480.59, "r_y2": 489.0, "r_x3": 134.76, "r_y3": 489.0, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 509.75, "r_x1": 480.59, "r_y1": 509.75, "r_x2": 480.59, "r_y2": 500.95, "r_x3": 134.76, "r_y3": 500.95, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 521.71, "r_x1": 154.71, "r_y1": 521.71, "r_x2": 154.71, "r_y2": 512.91, "r_x3": 134.76, "r_y3": 512.91, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 149.71, "t": 525.5, "r": 409.31, "b": 534.3, "coord_origin": "TOPLEFT" }, "confidence": 0.856, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 534.3, "r_x1": 409.31, "r_y1": 534.3, "r_x2": 409.31, "r_y2": 525.5, "r_x3": 149.71, "r_y3": 525.5, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 140.99, "t": 547.97, "r": 460.54, "b": 556.78, "coord_origin": "TOPLEFT" }, "confidence": 0.918, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 556.78, "r_x1": 146.72, "r_y1": 556.78, "r_x2": 146.72, "r_y2": 547.97, "r_x3": 140.99, "r_y3": 547.97, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 556.78, "r_x1": 193.21, "r_y1": 556.78, "r_x2": 193.21, "r_y2": 547.98, "r_x3": 151.7, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.52, "r_y0": 556.78, "r_x1": 263.47, "r_y1": 556.78, "r_x2": 263.47, "r_y2": 547.98, "r_x3": 196.52, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.81, "r_y0": 556.78, "r_x1": 460.54, "r_y1": 556.78, "r_x2": 460.54, "r_y2": 547.98, "r_x3": 267.81, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 140.99, "t": 560.56, "r": 480.59, "b": 581.32, "coord_origin": "TOPLEFT" }, "confidence": 0.932, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 569.37, "r_x1": 146.72, "r_y1": 569.37, "r_x2": 146.72, "r_y2": 560.56, "r_x3": 140.99, "r_y3": 560.56, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 569.37, "r_x1": 194.3, "r_y1": 569.37, "r_x2": 194.3, "r_y2": 560.57, "r_x3": 151.7, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.66, "r_y0": 569.37, "r_x1": 264.52, "r_y1": 569.37, "r_x2": 264.52, "r_y2": 560.57, "r_x3": 198.66, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.52, "r_y0": 569.37, "r_x1": 480.59, "r_y1": 569.37, "r_x2": 480.59, "r_y2": 560.57, "r_x3": 264.52, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 581.32, "r_x1": 171.68, "r_y1": 581.32, "r_x2": 171.68, "r_y2": 572.53, "r_x3": 151.7, "r_y3": 572.53, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 140.99, "t": 585.11, "r": 480.59, "b": 605.87, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 593.92, "r_x1": 146.72, "r_y1": 593.92, "r_x2": 146.72, "r_y2": 585.11, "r_x3": 140.99, "r_y3": 585.11, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 593.92, "r_x1": 194.11, "r_y1": 593.92, "r_x2": 194.11, "r_y2": 585.12, "r_x3": 151.7, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.75, "r_y0": 593.92, "r_x1": 259.89, "r_y1": 593.92, "r_x2": 259.89, "r_y2": 585.12, "r_x3": 197.75, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.89, "r_y0": 593.92, "r_x1": 480.59, "r_y1": 593.92, "r_x2": 480.59, "r_y2": 585.12, "r_x3": 259.89, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 605.87, "r_x1": 171.68, "r_y1": 605.87, "r_x2": 171.68, "r_y2": 597.08, "r_x3": 151.7, "r_y3": 597.08, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 140.99, "t": 609.66, "r": 454.55, "b": 618.47, "coord_origin": "TOPLEFT" }, "confidence": 0.904, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 618.47, "r_x1": 146.72, "r_y1": 618.47, "r_x2": 146.72, "r_y2": 609.66, "r_x3": 140.99, "r_y3": 609.66, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 618.47, "r_x1": 193.48, "r_y1": 618.47, "r_x2": 193.48, "r_y2": 609.67, "r_x3": 151.7, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.8, "r_y0": 618.47, "r_x1": 236.12, "r_y1": 618.47, "r_x2": 236.12, "r_y2": 609.67, "r_x3": 196.8, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.13, "r_y0": 618.47, "r_x1": 454.55, "r_y1": 618.47, "r_x2": 454.55, "r_y2": 609.67, "r_x3": 236.13, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 140.99, "t": 622.25, "r": 328.62, "b": 631.06, "coord_origin": "TOPLEFT" }, "confidence": 0.864, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 631.06, "r_x1": 146.72, "r_y1": 631.06, "r_x2": 146.72, "r_y2": 622.25, "r_x3": 140.99, "r_y3": 622.25, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 631.06, "r_x1": 181.99, "r_y1": 631.06, "r_x2": 181.99, "r_y2": 622.26, "r_x3": 151.7, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.32, "r_y0": 631.06, "r_x1": 221.46, "r_y1": 631.06, "r_x2": 221.46, "r_y2": 622.26, "r_x3": 185.32, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 631.06, "r_x1": 328.62, "r_y1": 631.06, "r_x2": 328.62, "r_y2": 622.26, "r_x3": 221.46, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "text", "bbox": { "l": 134.77, "t": 644.1, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 149.71, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 228.22, "r_y1": 664.85, "r_x2": 228.22, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" }, { "label": "page_header", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 139.69, "coord_origin": "TOPLEFT" }, "confidence": 0.963, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 364.63, "r_y1": 139.69, "r_x2": 364.63, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these complex syntax rules, simply to deliver valid output." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 143.48, "r": 480.6, "b": 295.74, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 152.28, "r_x1": 480.59, "r_y1": 152.28, "r_x2": 480.59, "r_y2": 143.48, "r_x3": 149.71, "r_y3": 143.48, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 164.23, "r_x1": 480.59, "r_y1": 164.23, "r_x2": 480.59, "r_y2": 155.44, "r_x3": 134.76, "r_y3": 155.44, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 176.19, "r_x1": 480.59, "r_y1": 176.19, "r_x2": 480.59, "r_y2": 167.39, "r_x3": 134.76, "r_y3": 167.39, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 188.14, "r_x1": 480.59, "r_y1": 188.14, "r_x2": 480.59, "r_y2": 179.35, "r_x3": 134.76, "r_y3": 179.35, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 200.1, "r_x1": 314.28, "r_y1": 200.1, "r_x2": 314.28, "r_y2": 191.3, "r_x3": 134.76, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.06, "r_y0": 200.1, "r_x1": 374.09, "r_y1": 200.1, "r_x2": 374.09, "r_y2": 191.3, "r_x3": 318.06, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.81, "r_y0": 200.1, "r_x1": 480.59, "r_y1": 200.1, "r_x2": 480.59, "r_y2": 191.3, "r_x3": 378.81, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 212.06, "r_x1": 480.59, "r_y1": 212.06, "r_x2": 480.59, "r_y2": 203.26, "r_x3": 134.76, "r_y3": 203.26, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 224.01, "r_x1": 480.6, "r_y1": 224.01, "r_x2": 480.6, "r_y2": 215.21, "r_x3": 134.76, "r_y3": 215.21, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.97, "r_x1": 480.59, "r_y1": 235.97, "r_x2": 480.59, "r_y2": 227.17, "r_x3": 134.76, "r_y3": 227.17, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.92, "r_x1": 480.59, "r_y1": 247.92, "r_x2": 480.59, "r_y2": 239.12, "r_x3": 134.76, "r_y3": 239.12, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.88, "r_x1": 480.59, "r_y1": 259.88, "r_x2": 480.59, "r_y2": 251.08, "r_x3": 134.76, "r_y3": 251.08, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 271.83, "r_x1": 480.59, "r_y1": 271.83, "r_x2": 480.59, "r_y2": 263.03, "r_x3": 134.76, "r_y3": 263.03, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.79, "r_x1": 480.59, "r_y1": 283.79, "r_x2": 480.59, "r_y2": 274.99, "r_x3": 134.76, "r_y3": 274.99, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.74, "r_x1": 223.57, "r_y1": 295.74, "r_x2": 223.57, "r_y2": 286.94, "r_x3": 134.76, "r_y3": 286.94, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, we observe two major issues with prediction quality when training Im2Seq models on HTML table structure generation from images. On the one hand, we find that on large tables, the visual attention of the model often starts to drift and is not accurately moving forward cell by cell anymore. This manifests itself in either in an increasing location drift for proposed table-cells in later rows on the same column or even complete loss of vertical alignment, as illustrated in Figure 5. Addressing this with post-processing is partially possible, but clearly undesired. On the other hand, we find many instances of predictions with structural inconsistencies or plain invalid HTML output, as shown in Figure 6, which are nearly impossible to properly correct. Both problems seriously impact the TSR model performance, since they reflect not only in the task of pure structure recognition but also in the equally crucial recognition or matching of table cell content." }, { "label": "section_header", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.76, "t": 320.63, "r": 372.51, "b": 331.2, "coord_origin": "TOPLEFT" }, "confidence": 0.957, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.2, "r_x1": 141.49, "r_y1": 331.2, "r_x2": 141.49, "r_y2": 320.63, "r_x3": 134.76, "r_y3": 320.63, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 331.2, "r_x1": 372.51, "r_y1": 331.2, "r_x2": 372.51, "r_y2": 320.63, "r_x3": 154.94, "r_y3": 320.63, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4 Optimised Table Structure Language" }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 349.12, "r": 480.59, "b": 441.6, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 357.91, "r_x1": 480.59, "r_y1": 357.91, "r_x2": 480.59, "r_y2": 349.12, "r_x3": 134.76, "r_y3": 349.12, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 369.87, "r_x1": 480.59, "r_y1": 369.87, "r_x2": 480.59, "r_y2": 361.07, "r_x3": 134.76, "r_y3": 361.07, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 381.82, "r_x1": 480.59, "r_y1": 381.82, "r_x2": 480.59, "r_y2": 373.03, "r_x3": 134.76, "r_y3": 373.03, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 393.78, "r_x1": 480.59, "r_y1": 393.78, "r_x2": 480.59, "r_y2": 384.98, "r_x3": 134.76, "r_y3": 384.98, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 405.73, "r_x1": 480.59, "r_y1": 405.73, "r_x2": 480.59, "r_y2": 396.94, "r_x3": 134.76, "r_y3": 396.94, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 417.69, "r_x1": 480.59, "r_y1": 417.69, "r_x2": 480.59, "r_y2": 408.89, "r_x3": 134.76, "r_y3": 408.89, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 429.64, "r_x1": 480.59, "r_y1": 429.64, "r_x2": 480.59, "r_y2": 420.85, "r_x3": 134.76, "r_y3": 420.85, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 441.6, "r_x1": 276.67, "r_y1": 441.6, "r_x2": 276.67, "r_y2": 432.8, "r_x3": 134.76, "r_y3": 432.8, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before, we propose here our Optimised Table Structure Language (OTSL). OTSL is designed to express table structure with a minimized vocabulary and a simple set of rules, which are both significantly reduced compared to HTML. At the same time, OTSL enables easy error detection and correction during sequence generation. We further demonstrate how the compact structure representation and minimized sequence length improves prediction accuracy and inference time in the TableFormer architecture." }, { "label": "section_header", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.76, "t": 465.87, "r": 261.8, "b": 474.68, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 474.68, "r_x1": 149.4, "r_y1": 474.68, "r_x2": 149.4, "r_y2": 465.87, "r_x3": 134.76, "r_y3": 465.87, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 474.68, "r_x1": 261.8, "r_y1": 474.68, "r_x2": 261.8, "r_y2": 465.87, "r_x3": 160.86, "r_y3": 465.87, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1 Language Definition" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 489.0, "r": 480.59, "b": 521.71, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 497.79, "r_x1": 480.59, "r_y1": 497.79, "r_x2": 480.59, "r_y2": 489.0, "r_x3": 134.76, "r_y3": 489.0, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 509.75, "r_x1": 480.59, "r_y1": 509.75, "r_x2": 480.59, "r_y2": 500.95, "r_x3": 134.76, "r_y3": 500.95, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 521.71, "r_x1": 154.71, "r_y1": 521.71, "r_x2": 154.71, "r_y2": 512.91, "r_x3": 134.76, "r_y3": 512.91, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines only 5 tokens that directly describe a tabular structure based on an atomic 2D grid." }, { "label": "text", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "text", "bbox": { "l": 149.71, "t": 525.5, "r": 409.31, "b": 534.3, "coord_origin": "TOPLEFT" }, "confidence": 0.856, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 534.3, "r_x1": 409.31, "r_y1": 534.3, "r_x2": 409.31, "r_y2": 525.5, "r_x3": 149.71, "r_y3": 525.5, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL vocabulary is comprised of the following tokens:" }, { "label": "list_item", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 140.99, "t": 547.97, "r": 460.54, "b": 556.78, "coord_origin": "TOPLEFT" }, "confidence": 0.918, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 556.78, "r_x1": 146.72, "r_y1": 556.78, "r_x2": 146.72, "r_y2": 547.97, "r_x3": 140.99, "r_y3": 547.97, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 556.78, "r_x1": 193.21, "r_y1": 556.78, "r_x2": 193.21, "r_y2": 547.98, "r_x3": 151.7, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.52, "r_y0": 556.78, "r_x1": 263.47, "r_y1": 556.78, "r_x2": 263.47, "r_y2": 547.98, "r_x3": 196.52, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.81, "r_y0": 556.78, "r_x1": 460.54, "r_y1": 556.78, "r_x2": 460.54, "r_y2": 547.98, "r_x3": 267.81, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"C\" cell a new table cell that either has or does not have cell content" }, { "label": "list_item", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 140.99, "t": 560.56, "r": 480.59, "b": 581.32, "coord_origin": "TOPLEFT" }, "confidence": 0.932, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 569.37, "r_x1": 146.72, "r_y1": 569.37, "r_x2": 146.72, "r_y2": 560.56, "r_x3": 140.99, "r_y3": 560.56, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 569.37, "r_x1": 194.3, "r_y1": 569.37, "r_x2": 194.3, "r_y2": 560.57, "r_x3": 151.7, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.66, "r_y0": 569.37, "r_x1": 264.52, "r_y1": 569.37, "r_x2": 264.52, "r_y2": 560.57, "r_x3": 198.66, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.52, "r_y0": 569.37, "r_x1": 480.59, "r_y1": 569.37, "r_x2": 480.59, "r_y2": 560.57, "r_x3": 264.52, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 581.32, "r_x1": 171.68, "r_y1": 581.32, "r_x2": 171.68, "r_y2": 572.53, "r_x3": 151.7, "r_y3": 572.53, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"L\" cell left-looking cell , merging with the left neighbor cell to create a span" }, { "label": "list_item", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 140.99, "t": 585.11, "r": 480.59, "b": 605.87, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 593.92, "r_x1": 146.72, "r_y1": 593.92, "r_x2": 146.72, "r_y2": 585.11, "r_x3": 140.99, "r_y3": 585.11, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 593.92, "r_x1": 194.11, "r_y1": 593.92, "r_x2": 194.11, "r_y2": 585.12, "r_x3": 151.7, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.75, "r_y0": 593.92, "r_x1": 259.89, "r_y1": 593.92, "r_x2": 259.89, "r_y2": 585.12, "r_x3": 197.75, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.89, "r_y0": 593.92, "r_x1": 480.59, "r_y1": 593.92, "r_x2": 480.59, "r_y2": 585.12, "r_x3": 259.89, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 605.87, "r_x1": 171.68, "r_y1": 605.87, "r_x2": 171.68, "r_y2": 597.08, "r_x3": 151.7, "r_y3": 597.08, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"U\" cell up-looking cell , merging with the upper neighbor cell to create a span" }, { "label": "list_item", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 140.99, "t": 609.66, "r": 454.55, "b": 618.47, "coord_origin": "TOPLEFT" }, "confidence": 0.904, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 618.47, "r_x1": 146.72, "r_y1": 618.47, "r_x2": 146.72, "r_y2": 609.66, "r_x3": 140.99, "r_y3": 609.66, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 618.47, "r_x1": 193.48, "r_y1": 618.47, "r_x2": 193.48, "r_y2": 609.67, "r_x3": 151.7, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.8, "r_y0": 618.47, "r_x1": 236.12, "r_y1": 618.47, "r_x2": 236.12, "r_y2": 609.67, "r_x3": 196.8, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.13, "r_y0": 618.47, "r_x1": 454.55, "r_y1": 618.47, "r_x2": 454.55, "r_y2": 609.67, "r_x3": 236.13, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"X\" cell cross cell , to merge with both left and upper neighbor cells" }, { "label": "list_item", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 140.99, "t": 622.25, "r": 328.62, "b": 631.06, "coord_origin": "TOPLEFT" }, "confidence": 0.864, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 631.06, "r_x1": 146.72, "r_y1": 631.06, "r_x2": 146.72, "r_y2": 622.25, "r_x3": 140.99, "r_y3": 622.25, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 631.06, "r_x1": 181.99, "r_y1": 631.06, "r_x2": 181.99, "r_y2": 622.26, "r_x3": 151.7, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.32, "r_y0": 631.06, "r_x1": 221.46, "r_y1": 631.06, "r_x2": 221.46, "r_y2": 622.26, "r_x3": 185.32, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 631.06, "r_x1": 328.62, "r_y1": 631.06, "r_x2": 328.62, "r_y2": 622.26, "r_x3": 221.46, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"NL\" new-line , switch to the next row." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 134.77, "t": 644.1, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 149.71, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 228.22, "r_y1": 664.85, "r_x2": 228.22, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless conversion to HTML." } ], "body": [ { "label": "text", "id": 3, "page_no": 5, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 139.69, "coord_origin": "TOPLEFT" }, "confidence": 0.963, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these", "orig": "generation. Implicitly, this also means that Im2Seq models need to learn these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 364.63, "r_y1": 139.69, "r_x2": 364.63, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "complex syntax rules, simply to deliver valid output.", "orig": "complex syntax rules, simply to deliver valid output.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "generation. Implicitly, this also means that Im2Seq models need to learn these complex syntax rules, simply to deliver valid output." }, { "label": "text", "id": 1, "page_no": 5, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 143.48, "r": 480.6, "b": 295.74, "coord_origin": "TOPLEFT" }, "confidence": 0.986, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 152.28, "r_x1": 480.59, "r_y1": 152.28, "r_x2": 480.59, "r_y2": 143.48, "r_x3": 149.71, "r_y3": 143.48, "coord_origin": "TOPLEFT" }, "text": "In practice, we observe two major issues with prediction quality when train-", "orig": "In practice, we observe two major issues with prediction quality when train-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 164.23, "r_x1": 480.59, "r_y1": 164.23, "r_x2": 480.59, "r_y2": 155.44, "r_x3": 134.76, "r_y3": 155.44, "coord_origin": "TOPLEFT" }, "text": "ing Im2Seq models on HTML table structure generation from images. On the", "orig": "ing Im2Seq models on HTML table structure generation from images. On the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 176.19, "r_x1": 480.59, "r_y1": 176.19, "r_x2": 480.59, "r_y2": 167.39, "r_x3": 134.76, "r_y3": 167.39, "coord_origin": "TOPLEFT" }, "text": "one hand, we find that on large tables, the visual attention of the model often", "orig": "one hand, we find that on large tables, the visual attention of the model often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 188.14, "r_x1": 480.59, "r_y1": 188.14, "r_x2": 480.59, "r_y2": 179.35, "r_x3": 134.76, "r_y3": 179.35, "coord_origin": "TOPLEFT" }, "text": "starts to drift and is not accurately moving forward cell by cell anymore. This", "orig": "starts to drift and is not accurately moving forward cell by cell anymore. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 200.1, "r_x1": 314.28, "r_y1": 200.1, "r_x2": 314.28, "r_y2": 191.3, "r_x3": 134.76, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "manifests itself in either in an increasing", "orig": "manifests itself in either in an increasing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.06, "r_y0": 200.1, "r_x1": 374.09, "r_y1": 200.1, "r_x2": 374.09, "r_y2": 191.3, "r_x3": 318.06, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "location drift", "orig": "location drift", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 378.81, "r_y0": 200.1, "r_x1": 480.59, "r_y1": 200.1, "r_x2": 480.59, "r_y2": 191.3, "r_x3": 378.81, "r_y3": 191.3, "coord_origin": "TOPLEFT" }, "text": "for proposed table-cells", "orig": "for proposed table-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 212.06, "r_x1": 480.59, "r_y1": 212.06, "r_x2": 480.59, "r_y2": 203.26, "r_x3": 134.76, "r_y3": 203.26, "coord_origin": "TOPLEFT" }, "text": "in later rows on the same column or even complete loss of vertical alignment, as", "orig": "in later rows on the same column or even complete loss of vertical alignment, as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 224.01, "r_x1": 480.6, "r_y1": 224.01, "r_x2": 480.6, "r_y2": 215.21, "r_x3": 134.76, "r_y3": 215.21, "coord_origin": "TOPLEFT" }, "text": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "orig": "illustrated in Figure 5. Addressing this with post-processing is partially possible,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 235.97, "r_x1": 480.59, "r_y1": 235.97, "r_x2": 480.59, "r_y2": 227.17, "r_x3": 134.76, "r_y3": 227.17, "coord_origin": "TOPLEFT" }, "text": "but clearly undesired. On the other hand, we find many instances of predictions", "orig": "but clearly undesired. On the other hand, we find many instances of predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 247.92, "r_x1": 480.59, "r_y1": 247.92, "r_x2": 480.59, "r_y2": 239.12, "r_x3": 134.76, "r_y3": 239.12, "coord_origin": "TOPLEFT" }, "text": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "orig": "with structural inconsistencies or plain invalid HTML output, as shown in Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 259.88, "r_x1": 480.59, "r_y1": 259.88, "r_x2": 480.59, "r_y2": 251.08, "r_x3": 134.76, "r_y3": 251.08, "coord_origin": "TOPLEFT" }, "text": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "orig": "ure 6, which are nearly impossible to properly correct. Both problems seriously", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 271.83, "r_x1": 480.59, "r_y1": 271.83, "r_x2": 480.59, "r_y2": 263.03, "r_x3": 134.76, "r_y3": 263.03, "coord_origin": "TOPLEFT" }, "text": "impact the TSR model performance, since they reflect not only in the task of", "orig": "impact the TSR model performance, since they reflect not only in the task of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.79, "r_x1": 480.59, "r_y1": 283.79, "r_x2": 480.59, "r_y2": 274.99, "r_x3": 134.76, "r_y3": 274.99, "coord_origin": "TOPLEFT" }, "text": "pure structure recognition but also in the equally crucial recognition or matching", "orig": "pure structure recognition but also in the equally crucial recognition or matching", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 295.74, "r_x1": 223.57, "r_y1": 295.74, "r_x2": 223.57, "r_y2": 286.94, "r_x3": 134.76, "r_y3": 286.94, "coord_origin": "TOPLEFT" }, "text": "of table cell content.", "orig": "of table cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In practice, we observe two major issues with prediction quality when training Im2Seq models on HTML table structure generation from images. On the one hand, we find that on large tables, the visual attention of the model often starts to drift and is not accurately moving forward cell by cell anymore. This manifests itself in either in an increasing location drift for proposed table-cells in later rows on the same column or even complete loss of vertical alignment, as illustrated in Figure 5. Addressing this with post-processing is partially possible, but clearly undesired. On the other hand, we find many instances of predictions with structural inconsistencies or plain invalid HTML output, as shown in Figure 6, which are nearly impossible to properly correct. Both problems seriously impact the TSR model performance, since they reflect not only in the task of pure structure recognition but also in the equally crucial recognition or matching of table cell content." }, { "label": "section_header", "id": 4, "page_no": 5, "cluster": { "id": 4, "label": "section_header", "bbox": { "l": 134.76, "t": 320.63, "r": 372.51, "b": 331.2, "coord_origin": "TOPLEFT" }, "confidence": 0.957, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.2, "r_x1": 141.49, "r_y1": 331.2, "r_x2": 141.49, "r_y2": 320.63, "r_x3": 134.76, "r_y3": 320.63, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 331.2, "r_x1": 372.51, "r_y1": 331.2, "r_x2": 372.51, "r_y2": 320.63, "r_x3": 154.94, "r_y3": 320.63, "coord_origin": "TOPLEFT" }, "text": "Optimised Table Structure Language", "orig": "Optimised Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4 Optimised Table Structure Language" }, { "label": "text", "id": 0, "page_no": 5, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 349.12, "r": 480.59, "b": 441.6, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 357.91, "r_x1": 480.59, "r_y1": 357.91, "r_x2": 480.59, "r_y2": 349.12, "r_x3": 134.76, "r_y3": 349.12, "coord_origin": "TOPLEFT" }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "orig": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 369.87, "r_x1": 480.59, "r_y1": 369.87, "r_x2": 480.59, "r_y2": 361.07, "r_x3": 134.76, "r_y3": 361.07, "coord_origin": "TOPLEFT" }, "text": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "orig": "we propose here our Optimised Table Structure Language (OTSL). OTSL is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 381.82, "r_x1": 480.59, "r_y1": 381.82, "r_x2": 480.59, "r_y2": 373.03, "r_x3": 134.76, "r_y3": 373.03, "coord_origin": "TOPLEFT" }, "text": "designed to express table structure with a minimized vocabulary and a simple", "orig": "designed to express table structure with a minimized vocabulary and a simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 393.78, "r_x1": 480.59, "r_y1": 393.78, "r_x2": 480.59, "r_y2": 384.98, "r_x3": 134.76, "r_y3": 384.98, "coord_origin": "TOPLEFT" }, "text": "set of rules, which are both significantly reduced compared to HTML. At the", "orig": "set of rules, which are both significantly reduced compared to HTML. At the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 405.73, "r_x1": 480.59, "r_y1": 405.73, "r_x2": 480.59, "r_y2": 396.94, "r_x3": 134.76, "r_y3": 396.94, "coord_origin": "TOPLEFT" }, "text": "same time, OTSL enables easy error detection and correction during sequence", "orig": "same time, OTSL enables easy error detection and correction during sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 417.69, "r_x1": 480.59, "r_y1": 417.69, "r_x2": 480.59, "r_y2": 408.89, "r_x3": 134.76, "r_y3": 408.89, "coord_origin": "TOPLEFT" }, "text": "generation. We further demonstrate how the compact structure representation", "orig": "generation. We further demonstrate how the compact structure representation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 429.64, "r_x1": 480.59, "r_y1": 429.64, "r_x2": 480.59, "r_y2": 420.85, "r_x3": 134.76, "r_y3": 420.85, "coord_origin": "TOPLEFT" }, "text": "and minimized sequence length improves prediction accuracy and inference time", "orig": "and minimized sequence length improves prediction accuracy and inference time", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 441.6, "r_x1": 276.67, "r_y1": 441.6, "r_x2": 276.67, "r_y2": 432.8, "r_x3": 134.76, "r_y3": 432.8, "coord_origin": "TOPLEFT" }, "text": "in the TableFormer architecture.", "orig": "in the TableFormer architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To mitigate the issues with HTML in Im2Seq-based TSR models laid out before, we propose here our Optimised Table Structure Language (OTSL). OTSL is designed to express table structure with a minimized vocabulary and a simple set of rules, which are both significantly reduced compared to HTML. At the same time, OTSL enables easy error detection and correction during sequence generation. We further demonstrate how the compact structure representation and minimized sequence length improves prediction accuracy and inference time in the TableFormer architecture." }, { "label": "section_header", "id": 5, "page_no": 5, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.76, "t": 465.87, "r": 261.8, "b": 474.68, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 474.68, "r_x1": 149.4, "r_y1": 474.68, "r_x2": 149.4, "r_y2": 465.87, "r_x3": 134.76, "r_y3": 465.87, "coord_origin": "TOPLEFT" }, "text": "4.1", "orig": "4.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 474.68, "r_x1": 261.8, "r_y1": 474.68, "r_x2": 261.8, "r_y2": 465.87, "r_x3": 160.86, "r_y3": 465.87, "coord_origin": "TOPLEFT" }, "text": "Language Definition", "orig": "Language Definition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.1 Language Definition" }, { "label": "text", "id": 2, "page_no": 5, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 489.0, "r": 480.59, "b": 521.71, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 497.79, "r_x1": 480.59, "r_y1": 497.79, "r_x2": 480.59, "r_y2": 489.0, "r_x3": 134.76, "r_y3": 489.0, "coord_origin": "TOPLEFT" }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "orig": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 509.75, "r_x1": 480.59, "r_y1": 509.75, "r_x2": 480.59, "r_y2": 500.95, "r_x3": 134.76, "r_y3": 500.95, "coord_origin": "TOPLEFT" }, "text": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "orig": "only 5 tokens that directly describe a tabular structure based on an atomic 2D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 521.71, "r_x1": 154.71, "r_y1": 521.71, "r_x2": 154.71, "r_y2": 512.91, "r_x3": 134.76, "r_y3": 512.91, "coord_origin": "TOPLEFT" }, "text": "grid.", "orig": "grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "In Figure 3, we illustrate how the OTSL is defined. In essence, the OTSL defines only 5 tokens that directly describe a tabular structure based on an atomic 2D grid." }, { "label": "text", "id": 13, "page_no": 5, "cluster": { "id": 13, "label": "text", "bbox": { "l": 149.71, "t": 525.5, "r": 409.31, "b": 534.3, "coord_origin": "TOPLEFT" }, "confidence": 0.856, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 534.3, "r_x1": 409.31, "r_y1": 534.3, "r_x2": 409.31, "r_y2": 525.5, "r_x3": 149.71, "r_y3": 525.5, "coord_origin": "TOPLEFT" }, "text": "The OTSL vocabulary is comprised of the following tokens:", "orig": "The OTSL vocabulary is comprised of the following tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL vocabulary is comprised of the following tokens:" }, { "label": "list_item", "id": 9, "page_no": 5, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 140.99, "t": 547.97, "r": 460.54, "b": 556.78, "coord_origin": "TOPLEFT" }, "confidence": 0.918, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 556.78, "r_x1": 146.72, "r_y1": 556.78, "r_x2": 146.72, "r_y2": 547.97, "r_x3": 140.99, "r_y3": 547.97, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 556.78, "r_x1": 193.21, "r_y1": 556.78, "r_x2": 193.21, "r_y2": 547.98, "r_x3": 151.7, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "\"C\" cell -", "orig": "\"C\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.52, "r_y0": 556.78, "r_x1": 263.47, "r_y1": 556.78, "r_x2": 263.47, "r_y2": 547.98, "r_x3": 196.52, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "a new table cell", "orig": "a new table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 267.81, "r_y0": 556.78, "r_x1": 460.54, "r_y1": 556.78, "r_x2": 460.54, "r_y2": 547.98, "r_x3": 267.81, "r_y3": 547.98, "coord_origin": "TOPLEFT" }, "text": "that either has or does not have cell content", "orig": "that either has or does not have cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"C\" cell a new table cell that either has or does not have cell content" }, { "label": "list_item", "id": 8, "page_no": 5, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 140.99, "t": 560.56, "r": 480.59, "b": 581.32, "coord_origin": "TOPLEFT" }, "confidence": 0.932, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 569.37, "r_x1": 146.72, "r_y1": 569.37, "r_x2": 146.72, "r_y2": 560.56, "r_x3": 140.99, "r_y3": 560.56, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 569.37, "r_x1": 194.3, "r_y1": 569.37, "r_x2": 194.3, "r_y2": 560.57, "r_x3": 151.7, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": "\"L\" cell -", "orig": "\"L\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 198.66, "r_y0": 569.37, "r_x1": 264.52, "r_y1": 569.37, "r_x2": 264.52, "r_y2": 560.57, "r_x3": 198.66, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": "left-looking cell", "orig": "left-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.52, "r_y0": 569.37, "r_x1": 480.59, "r_y1": 569.37, "r_x2": 480.59, "r_y2": 560.57, "r_x3": 264.52, "r_y3": 560.57, "coord_origin": "TOPLEFT" }, "text": ", merging with the left neighbor cell to create a", "orig": ", merging with the left neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 581.32, "r_x1": 171.68, "r_y1": 581.32, "r_x2": 171.68, "r_y2": 572.53, "r_x3": 151.7, "r_y3": 572.53, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"L\" cell left-looking cell , merging with the left neighbor cell to create a span" }, { "label": "list_item", "id": 7, "page_no": 5, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 140.99, "t": 585.11, "r": 480.59, "b": 605.87, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 593.92, "r_x1": 146.72, "r_y1": 593.92, "r_x2": 146.72, "r_y2": 585.11, "r_x3": 140.99, "r_y3": 585.11, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 593.92, "r_x1": 194.11, "r_y1": 593.92, "r_x2": 194.11, "r_y2": 585.12, "r_x3": 151.7, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": "\"U\" cell -", "orig": "\"U\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 197.75, "r_y0": 593.92, "r_x1": 259.89, "r_y1": 593.92, "r_x2": 259.89, "r_y2": 585.12, "r_x3": 197.75, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": "up-looking cell", "orig": "up-looking cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 259.89, "r_y0": 593.92, "r_x1": 480.59, "r_y1": 593.92, "r_x2": 480.59, "r_y2": 585.12, "r_x3": 259.89, "r_y3": 585.12, "coord_origin": "TOPLEFT" }, "text": ", merging with the upper neighbor cell to create a", "orig": ", merging with the upper neighbor cell to create a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 605.87, "r_x1": 171.68, "r_y1": 605.87, "r_x2": 171.68, "r_y2": 597.08, "r_x3": 151.7, "r_y3": 597.08, "coord_origin": "TOPLEFT" }, "text": "span", "orig": "span", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"U\" cell up-looking cell , merging with the upper neighbor cell to create a span" }, { "label": "list_item", "id": 10, "page_no": 5, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 140.99, "t": 609.66, "r": 454.55, "b": 618.47, "coord_origin": "TOPLEFT" }, "confidence": 0.904, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 618.47, "r_x1": 146.72, "r_y1": 618.47, "r_x2": 146.72, "r_y2": 609.66, "r_x3": 140.99, "r_y3": 609.66, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 618.47, "r_x1": 193.48, "r_y1": 618.47, "r_x2": 193.48, "r_y2": 609.67, "r_x3": 151.7, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": "\"X\" cell -", "orig": "\"X\" cell -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.8, "r_y0": 618.47, "r_x1": 236.12, "r_y1": 618.47, "r_x2": 236.12, "r_y2": 609.67, "r_x3": 196.8, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": "cross cell", "orig": "cross cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 236.13, "r_y0": 618.47, "r_x1": 454.55, "r_y1": 618.47, "r_x2": 454.55, "r_y2": 609.67, "r_x3": 236.13, "r_y3": 609.67, "coord_origin": "TOPLEFT" }, "text": ", to merge with both left and upper neighbor cells", "orig": ", to merge with both left and upper neighbor cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"X\" cell cross cell , to merge with both left and upper neighbor cells" }, { "label": "list_item", "id": 12, "page_no": 5, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 140.99, "t": 622.25, "r": 328.62, "b": 631.06, "coord_origin": "TOPLEFT" }, "confidence": 0.864, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 140.99, "r_y0": 631.06, "r_x1": 146.72, "r_y1": 631.06, "r_x2": 146.72, "r_y2": 622.25, "r_x3": 140.99, "r_y3": 622.25, "coord_origin": "TOPLEFT" }, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 631.06, "r_x1": 181.99, "r_y1": 631.06, "r_x2": 181.99, "r_y2": 622.26, "r_x3": 151.7, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": "\"NL\" -", "orig": "\"NL\" -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.32, "r_y0": 631.06, "r_x1": 221.46, "r_y1": 631.06, "r_x2": 221.46, "r_y2": 622.26, "r_x3": 185.32, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": "new-line", "orig": "new-line", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.46, "r_y0": 631.06, "r_x1": 328.62, "r_y1": 631.06, "r_x2": 328.62, "r_y2": 622.26, "r_x3": 221.46, "r_y3": 622.26, "coord_origin": "TOPLEFT" }, "text": ", switch to the next row.", "orig": ", switch to the next row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "-\"NL\" new-line , switch to the next row." }, { "label": "text", "id": 6, "page_no": 5, "cluster": { "id": 6, "label": "text", "bbox": { "l": 134.77, "t": 644.1, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 149.71, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless", "orig": "A notable attribute of OTSL is that it has the capability of achieving lossless", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 664.85, "r_x1": 228.22, "r_y1": 664.85, "r_x2": 228.22, "r_y2": 656.06, "r_x3": 134.77, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "conversion to HTML.", "orig": "conversion to HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "A notable attribute of OTSL is that it has the capability of achieving lossless conversion to HTML." } ], "headers": [ { "label": "page_header", "id": 14, "page_no": 5, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.838, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6" }, { "label": "page_header", "id": 11, "page_no": 5, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.892, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 6, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 133.73, "r_x1": 162.64, "r_y1": 133.73, "r_x2": 162.64, "r_y2": 125.8, "r_x3": 134.76, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.28, "r_y0": 133.93, "r_x1": 480.59, "r_y1": 133.93, "r_x2": 480.59, "r_y2": 125.86, "r_x3": 166.28, "r_y3": 125.86, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 144.89, "r_x1": 480.59, "r_y1": 144.89, "r_x2": 480.59, "r_y2": 136.82, "r_x3": 134.76, "r_y3": 136.82, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.85, "r_x1": 306.12, "r_y1": 155.85, "r_x2": 306.12, "r_y2": 147.78, "r_x3": 134.76, "r_y3": 147.78, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49, "r_y0": 177.92, "r_x1": 381.67, "r_y1": 177.92, "r_x2": 381.67, "r_y2": 168.59, "r_x3": 374.49, "r_y3": 168.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74, "r_y0": 177.82, "r_x1": 405.92, "r_y1": 177.82, "r_x2": 405.92, "r_y2": 168.5, "r_x3": 398.74, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.77, "r_y0": 202.25, "r_x1": 380.94, "r_y1": 202.25, "r_x2": 380.94, "r_y2": 192.93, "r_x3": 373.77, "r_y3": 192.93, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66, "r_y0": 202.39, "r_x1": 393.84, "r_y1": 202.39, "r_x2": 393.84, "r_y2": 193.07, "r_x3": 386.66, "r_y3": 193.07, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.69, "r_y0": 214.46, "r_x1": 393.86, "r_y1": 214.46, "r_x2": 393.86, "r_y2": 205.14, "r_x3": 386.69, "r_y3": 205.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.66, "r_y0": 190.05, "r_x1": 405.83, "r_y1": 190.05, "r_x2": 405.83, "r_y2": 180.73, "r_x3": 398.66, "r_y3": 180.73, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.78, "r_y0": 190.06, "r_x1": 417.95, "r_y1": 190.06, "r_x2": 417.95, "r_y2": 180.74, "r_x3": 410.78, "r_y3": 180.74, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.91, "r_y0": 189.97, "r_x1": 430.08, "r_y1": 189.97, "r_x2": 430.08, "r_y2": 180.65, "r_x3": 422.91, "r_y3": 180.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 202.31, "r_x1": 405.96, "r_y1": 202.31, "r_x2": 405.96, "r_y2": 192.99, "r_x3": 398.78, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.32, "r_x1": 418.08, "r_y1": 202.32, "r_x2": 418.08, "r_y2": 192.99, "r_x3": 410.9, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 202.23, "r_x1": 430.2, "r_y1": 202.23, "r_x2": 430.2, "r_y2": 192.91, "r_x3": 423.03, "r_y3": 192.91, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 214.64, "r_x1": 405.96, "r_y1": 214.64, "r_x2": 405.96, "r_y2": 205.32, "r_x3": 398.78, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.64, "r_x1": 418.08, "r_y1": 214.64, "r_x2": 418.08, "r_y2": 205.32, "r_x3": 410.9, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 214.56, "r_x1": 430.21, "r_y1": 214.56, "r_x2": 430.21, "r_y2": 205.24, "r_x3": 423.03, "r_y3": 205.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.51, "r_y0": 226.36, "r_x1": 393.68, "r_y1": 226.36, "r_x2": 393.68, "r_y2": 217.04, "r_x3": 386.51, "r_y3": 217.04, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.54, "r_x1": 405.78, "r_y1": 226.54, "r_x2": 405.78, "r_y2": 217.22, "r_x3": 398.6, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72, "r_y0": 226.54, "r_x1": 417.9, "r_y1": 226.54, "r_x2": 417.9, "r_y2": 217.22, "r_x3": 410.72, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.85, "r_y0": 226.46, "r_x1": 430.02, "r_y1": 226.46, "r_x2": 430.02, "r_y2": 217.14, "r_x3": 422.85, "r_y3": 217.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16, "r_y0": 177.01, "r_x1": 447.86, "r_y1": 177.01, "r_x2": 447.86, "r_y2": 167.69, "r_x3": 435.16, "r_y3": 167.69, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44, "r_y0": 189.52, "r_x1": 448.15, "r_y1": 189.52, "r_x2": 448.15, "r_y2": 180.2, "r_x3": 435.44, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.47, "r_y0": 201.82, "r_x1": 448.17, "r_y1": 201.82, "r_x2": 448.17, "r_y2": 192.49, "r_x3": 435.47, "r_y3": 192.49, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38, "r_y0": 214.15, "r_x1": 448.08, "r_y1": 214.15, "r_x2": 448.08, "r_y2": 204.83, "r_x3": 435.38, "r_y3": 204.83, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.56, "r_x1": 448.3, "r_y1": 226.56, "r_x2": 448.3, "r_y2": 217.23, "r_x3": 435.6, "r_y3": 217.23, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.15, "r_y0": 214.56, "r_x1": 381.32, "r_y1": 214.56, "r_x2": 381.32, "r_y2": 205.23, "r_x3": 374.15, "r_y3": 205.23, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.04, "r_y0": 226.47, "r_x1": 381.22, "r_y1": 226.47, "r_x2": 381.22, "r_y2": 217.15, "r_x3": 374.04, "r_y3": 217.15, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34, "r_y0": 190.26, "r_x1": 381.52, "r_y1": 190.26, "r_x2": 381.52, "r_y2": 180.93, "r_x3": 374.34, "r_y3": 180.93, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76, "r_y0": 177.9, "r_x1": 393.29, "r_y1": 177.9, "r_x2": 393.29, "r_y2": 168.58, "r_x3": 387.76, "r_y3": 168.58, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86, "r_y0": 177.38, "r_x1": 417.39, "r_y1": 177.38, "r_x2": 417.39, "r_y2": 168.06, "r_x3": 411.86, "r_y3": 168.06, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.34, "r_y0": 177.26, "r_x1": 428.86, "r_y1": 177.26, "r_x2": 428.86, "r_y2": 167.93, "r_x3": 423.34, "r_y3": 167.93, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.14, "r_y0": 190.11, "r_x1": 393.76, "r_y1": 190.11, "r_x2": 393.76, "r_y2": 180.79, "r_x3": 387.14, "r_y3": 180.79, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.26, "r_y0": 253.83, "r_x1": 289.43, "r_y1": 253.83, "r_x2": 289.43, "r_y2": 244.51, "r_x3": 282.26, "r_y3": 244.51, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11, "r_y0": 266.17, "r_x1": 289.29, "r_y1": 266.17, "r_x2": 289.29, "r_y2": 256.85, "r_x3": 282.11, "r_y3": 256.85, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.41, "r_y0": 278.45, "r_x1": 289.58, "r_y1": 278.45, "r_x2": 289.58, "r_y2": 269.13, "r_x3": 282.41, "r_y3": 269.13, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.53, "r_y0": 253.82, "r_x1": 301.05, "r_y1": 253.82, "r_x2": 301.05, "r_y2": 244.49, "r_x3": 295.53, "r_y3": 244.49, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.47, "r_y0": 253.9, "r_x1": 312.99, "r_y1": 253.9, "r_x2": 312.99, "r_y2": 244.57, "r_x3": 307.47, "r_y3": 244.57, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 253.76, "r_x1": 324.29, "r_y1": 253.76, "r_x2": 324.29, "r_y2": 244.44, "r_x3": 318.77, "r_y3": 244.44, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.02, "r_x1": 301.04, "r_y1": 266.02, "r_x2": 301.04, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.18, "r_y0": 266.02, "r_x1": 325.59, "r_y1": 266.02, "r_x2": 325.59, "r_y2": 256.7, "r_x3": 307.18, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.79, "r_y0": 278.58, "r_x1": 300.93, "r_y1": 278.58, "r_x2": 300.93, "r_y2": 269.25, "r_x3": 294.79, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06, "r_y0": 278.58, "r_x1": 325.48, "r_y1": 278.58, "r_x2": 325.48, "r_y2": 269.25, "r_x3": 307.06, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.94, "r_y0": 278.07, "r_x1": 203.11, "r_y1": 278.07, "r_x2": 203.11, "r_y2": 268.75, "r_x3": 195.94, "r_y3": 268.75, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.21, "r_y0": 278.05, "r_x1": 214.73, "r_y1": 278.05, "r_x2": 214.73, "r_y2": 268.73, "r_x3": 209.21, "r_y3": 268.73, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.15, "r_y0": 278.13, "r_x1": 226.67, "r_y1": 278.13, "r_x2": 226.67, "r_y2": 268.81, "r_x3": 221.15, "r_y3": 268.81, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.45, "r_y0": 278.0, "r_x1": 237.97, "r_y1": 278.0, "r_x2": 237.97, "r_y2": 268.68, "r_x3": 232.45, "r_y3": 268.68, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.22, "r_y0": 253.86, "r_x1": 203.39, "r_y1": 253.86, "r_x2": 203.39, "r_y2": 244.54, "r_x3": 196.22, "r_y3": 244.54, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32, "r_y0": 253.42, "r_x1": 257.5, "r_y1": 253.42, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.32, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17, "r_y0": 265.76, "r_x1": 257.35, "r_y1": 265.76, "r_x2": 257.35, "r_y2": 256.44, "r_x3": 250.17, "r_y3": 256.44, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47, "r_y0": 278.04, "r_x1": 257.65, "r_y1": 278.04, "r_x2": 257.65, "r_y2": 268.72, "r_x3": 250.47, "r_y3": 268.72, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 249.21, "r_x1": 337.22, "r_y1": 249.21, "r_x2": 337.22, "r_y2": 242.99, "r_x3": 334.51, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.94, "r_y0": 249.21, "r_x1": 391.49, "r_y1": 249.21, "r_x2": 391.49, "r_y2": 242.99, "r_x3": 339.94, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 259.15, "r_x1": 337.33, "r_y1": 259.15, "r_x2": 337.33, "r_y2": 252.93, "r_x3": 334.51, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15, "r_y0": 259.15, "r_x1": 421.99, "r_y1": 259.15, "r_x2": 421.99, "r_y2": 252.93, "r_x3": 340.15, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 269.08, "r_x1": 337.3, "r_y1": 269.08, "r_x2": 337.3, "r_y2": 262.87, "r_x3": 334.51, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 269.08, "r_x1": 415.34, "r_y1": 269.08, "r_x2": 415.34, "r_y2": 262.87, "r_x3": 340.09, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 279.02, "r_x1": 337.3, "r_y1": 279.02, "r_x2": 337.3, "r_y2": 272.81, "r_x3": 334.51, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 279.02, "r_x1": 426.6, "r_y1": 279.02, "r_x2": 426.6, "r_y2": 272.81, "r_x3": 340.09, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67, "r_y0": 250.26, "r_x1": 189.36, "r_y1": 250.26, "r_x2": 189.36, "r_y2": 244.04, "r_x3": 185.67, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.97, "r_y0": 274.56, "r_x1": 189.65, "r_y1": 274.56, "r_x2": 189.65, "r_y2": 268.35, "r_x3": 185.97, "r_y3": 268.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34, "r_y0": 249.84, "r_x1": 243.03, "r_y1": 249.84, "r_x2": 243.03, "r_y2": 243.63, "r_x3": 239.34, "r_y3": 243.63, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.33, "r_y0": 249.71, "r_x1": 275.01, "r_y1": 249.71, "r_x2": 275.01, "r_y2": 243.49, "r_x3": 271.33, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.82, "r_y0": 172.73, "r_x1": 233.5, "r_y1": 172.73, "r_x2": 233.5, "r_y2": 166.51, "r_x3": 229.82, "r_y3": 166.51, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24, "r_y0": 196.18, "r_x1": 260.93, "r_y1": 196.18, "r_x2": 260.93, "r_y2": 189.96, "r_x3": 257.24, "r_y3": 189.96, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.88, "r_y0": 184.19, "r_x1": 190.56, "r_y1": 184.19, "r_x2": 190.56, "r_y2": 177.98, "r_x3": 186.88, "r_y3": 177.98, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.49, "r_y0": 175.23, "r_x1": 200.17, "r_y1": 175.23, "r_x2": 200.17, "r_y2": 169.02, "r_x3": 196.49, "r_y3": 169.02, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 175.65, "r_x1": 175.73, "r_y1": 175.65, "r_x2": 175.73, "r_y2": 167.88, "r_x3": 169.75, "r_y3": 167.88, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 214.61, "r_x1": 175.73, "r_y1": 214.61, "r_x2": 175.73, "r_y2": 206.84, "r_x3": 169.75, "r_y3": 206.84, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29, "r_y0": 176.05, "r_x1": 280.27, "r_y1": 176.05, "r_x2": 280.27, "r_y2": 168.28, "r_x3": 274.29, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56, "r_y0": 176.05, "r_x1": 365.54, "r_y1": 176.05, "r_x2": 365.54, "r_y2": 168.28, "r_x3": 359.56, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 250.98, "r_x1": 175.27, "r_y1": 250.98, "r_x2": 175.27, "r_y2": 243.21, "r_x3": 169.75, "r_y3": 243.21, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 314.1, "r_x1": 149.4, "r_y1": 314.1, "r_x2": 149.4, "r_y2": 305.3, "r_x3": 134.76, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 314.1, "r_x1": 246.65, "r_y1": 314.1, "r_x2": 246.65, "r_y2": 305.3, "r_x3": 160.86, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 334.04, "r_x1": 363.8, "r_y1": 334.04, "r_x2": 363.8, "r_y2": 325.25, "r_x3": 134.76, "r_y3": 325.25, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 355.98, "r_x1": 146.72, "r_y1": 355.98, "r_x2": 146.72, "r_y2": 347.18, "r_x3": 138.97, "r_y3": 347.18, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 355.98, "r_x1": 257.38, "r_y1": 355.98, "r_x2": 257.38, "r_y2": 347.17, "r_x3": 151.7, "r_y3": 347.17, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.38, "r_y0": 355.98, "r_x1": 480.59, "r_y1": 355.98, "r_x2": 480.59, "r_y2": 347.18, "r_x3": 257.38, "r_y3": 347.18, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 367.93, "r_x1": 283.59, "r_y1": 367.93, "r_x2": 283.59, "r_y2": 359.14, "r_x3": 151.7, "r_y3": 359.14, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 379.89, "r_x1": 146.72, "r_y1": 379.89, "r_x2": 146.72, "r_y2": 371.09, "r_x3": 138.97, "r_y3": 371.09, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 379.89, "r_x1": 252.11, "r_y1": 379.89, "r_x2": 252.11, "r_y2": 371.08, "r_x3": 151.7, "r_y3": 371.08, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.11, "r_y0": 379.89, "r_x1": 480.59, "r_y1": 379.89, "r_x2": 480.59, "r_y2": 371.09, "r_x3": 252.11, "r_y3": 371.09, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 391.85, "r_x1": 284.84, "r_y1": 391.85, "r_x2": 284.84, "r_y2": 383.05, "r_x3": 151.7, "r_y3": 383.05, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 403.8, "r_x1": 146.72, "r_y1": 403.8, "r_x2": 146.72, "r_y2": 395.01, "r_x3": 138.97, "r_y3": 395.01, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 403.8, "r_x1": 223.3, "r_y1": 403.8, "r_x2": 223.3, "r_y2": 395.0, "r_x3": 151.7, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.31, "r_y0": 403.8, "r_x1": 226.07, "r_y1": 403.8, "r_x2": 226.07, "r_y2": 395.01, "r_x3": 223.31, "r_y3": 395.01, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 415.76, "r_x1": 480.59, "r_y1": 415.76, "r_x2": 480.59, "r_y2": 406.97, "r_x3": 151.7, "r_y3": 406.97, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 427.72, "r_x1": 480.59, "r_y1": 427.72, "r_x2": 480.59, "r_y2": 418.92, "r_x3": 151.7, "r_y3": 418.92, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 439.67, "r_x1": 214.4, "r_y1": 439.67, "r_x2": 214.4, "r_y2": 430.88, "r_x3": 151.7, "r_y3": 430.88, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 451.63, "r_x1": 146.72, "r_y1": 451.63, "r_x2": 146.72, "r_y2": 442.84, "r_x3": 138.97, "r_y3": 442.84, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 451.63, "r_x1": 221.32, "r_y1": 451.63, "r_x2": 221.32, "r_y2": 442.83, "r_x3": 151.7, "r_y3": 442.83, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.33, "r_y0": 451.63, "r_x1": 474.59, "r_y1": 451.63, "r_x2": 474.59, "r_y2": 442.84, "r_x3": 221.33, "r_y3": 442.84, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 463.59, "r_x1": 146.72, "r_y1": 463.59, "r_x2": 146.72, "r_y2": 454.79, "r_x3": 138.97, "r_y3": 454.79, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 463.59, "r_x1": 240.72, "r_y1": 463.59, "r_x2": 240.72, "r_y2": 454.78, "r_x3": 151.7, "r_y3": 454.78, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.72, "r_y0": 463.59, "r_x1": 480.59, "r_y1": 463.59, "r_x2": 480.59, "r_y2": 454.79, "r_x3": 240.72, "r_y3": 454.79, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 475.55, "r_x1": 186.01, "r_y1": 475.55, "r_x2": 186.01, "r_y2": 466.75, "r_x3": 151.7, "r_y3": 466.75, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 487.5, "r_x1": 146.72, "r_y1": 487.5, "r_x2": 146.72, "r_y2": 478.71, "r_x3": 138.97, "r_y3": 478.71, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 487.5, "r_x1": 235.16, "r_y1": 487.5, "r_x2": 235.16, "r_y2": 478.7, "r_x3": 151.7, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.16, "r_y0": 487.5, "r_x1": 480.59, "r_y1": 487.5, "r_x2": 480.59, "r_y2": 478.71, "r_x3": 235.16, "r_y3": 478.71, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 499.46, "r_x1": 448.04, "r_y1": 499.46, "r_x2": 448.04, "r_y2": 490.66, "r_x3": 151.7, "r_y3": 490.66, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 521.39, "r_x1": 480.6, "r_y1": 521.39, "r_x2": 480.6, "r_y2": 512.59, "r_x3": 149.71, "r_y3": 512.59, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.34, "r_x1": 480.59, "r_y1": 533.34, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.5, "r_x3": 134.76, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.41, "r_x3": 134.76, "r_y3": 560.41, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.32, "r_x3": 134.76, "r_y3": 584.32, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.23, "r_x3": 134.76, "r_y3": 608.23, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.76, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 311.2, "r_y1": 640.94, "r_x2": 311.2, "r_y2": 632.14, "r_x3": 134.76, "r_y3": 632.14, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 149.71, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.875, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "caption", "bbox": { "l": 134.76, "t": 125.8, "r": 480.59, "b": 155.85, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 133.73, "r_x1": 162.64, "r_y1": 133.73, "r_x2": 162.64, "r_y2": 125.8, "r_x3": 134.76, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.28, "r_y0": 133.93, "r_x1": 480.59, "r_y1": 133.93, "r_x2": 480.59, "r_y2": 125.86, "r_x3": 166.28, "r_y3": 125.86, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 144.89, "r_x1": 480.59, "r_y1": 144.89, "r_x2": 480.59, "r_y2": 136.82, "r_x3": 134.76, "r_y3": 136.82, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.85, "r_x1": 306.12, "r_y1": 155.85, "r_x2": 306.12, "r_y2": 147.78, "r_x3": 134.76, "r_y3": 147.78, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "picture", "bbox": { "l": 164.65, "t": 163.8, "r": 449.55, "b": 280.34, "coord_origin": "TOPLEFT" }, "confidence": 0.787, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49, "r_y0": 177.92, "r_x1": 381.67, "r_y1": 177.92, "r_x2": 381.67, "r_y2": 168.59, "r_x3": 374.49, "r_y3": 168.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74, "r_y0": 177.82, "r_x1": 405.92, "r_y1": 177.82, "r_x2": 405.92, "r_y2": 168.5, "r_x3": 398.74, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.77, "r_y0": 202.25, "r_x1": 380.94, "r_y1": 202.25, "r_x2": 380.94, "r_y2": 192.93, "r_x3": 373.77, "r_y3": 192.93, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66, "r_y0": 202.39, "r_x1": 393.84, "r_y1": 202.39, "r_x2": 393.84, "r_y2": 193.07, "r_x3": 386.66, "r_y3": 193.07, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.69, "r_y0": 214.46, "r_x1": 393.86, "r_y1": 214.46, "r_x2": 393.86, "r_y2": 205.14, "r_x3": 386.69, "r_y3": 205.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.66, "r_y0": 190.05, "r_x1": 405.83, "r_y1": 190.05, "r_x2": 405.83, "r_y2": 180.73, "r_x3": 398.66, "r_y3": 180.73, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.78, "r_y0": 190.06, "r_x1": 417.95, "r_y1": 190.06, "r_x2": 417.95, "r_y2": 180.74, "r_x3": 410.78, "r_y3": 180.74, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.91, "r_y0": 189.97, "r_x1": 430.08, "r_y1": 189.97, "r_x2": 430.08, "r_y2": 180.65, "r_x3": 422.91, "r_y3": 180.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 202.31, "r_x1": 405.96, "r_y1": 202.31, "r_x2": 405.96, "r_y2": 192.99, "r_x3": 398.78, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.32, "r_x1": 418.08, "r_y1": 202.32, "r_x2": 418.08, "r_y2": 192.99, "r_x3": 410.9, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 202.23, "r_x1": 430.2, "r_y1": 202.23, "r_x2": 430.2, "r_y2": 192.91, "r_x3": 423.03, "r_y3": 192.91, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 214.64, "r_x1": 405.96, "r_y1": 214.64, "r_x2": 405.96, "r_y2": 205.32, "r_x3": 398.78, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.64, "r_x1": 418.08, "r_y1": 214.64, "r_x2": 418.08, "r_y2": 205.32, "r_x3": 410.9, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 214.56, "r_x1": 430.21, "r_y1": 214.56, "r_x2": 430.21, "r_y2": 205.24, "r_x3": 423.03, "r_y3": 205.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.51, "r_y0": 226.36, "r_x1": 393.68, "r_y1": 226.36, "r_x2": 393.68, "r_y2": 217.04, "r_x3": 386.51, "r_y3": 217.04, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.54, "r_x1": 405.78, "r_y1": 226.54, "r_x2": 405.78, "r_y2": 217.22, "r_x3": 398.6, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72, "r_y0": 226.54, "r_x1": 417.9, "r_y1": 226.54, "r_x2": 417.9, "r_y2": 217.22, "r_x3": 410.72, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.85, "r_y0": 226.46, "r_x1": 430.02, "r_y1": 226.46, "r_x2": 430.02, "r_y2": 217.14, "r_x3": 422.85, "r_y3": 217.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16, "r_y0": 177.01, "r_x1": 447.86, "r_y1": 177.01, "r_x2": 447.86, "r_y2": 167.69, "r_x3": 435.16, "r_y3": 167.69, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44, "r_y0": 189.52, "r_x1": 448.15, "r_y1": 189.52, "r_x2": 448.15, "r_y2": 180.2, "r_x3": 435.44, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.47, "r_y0": 201.82, "r_x1": 448.17, "r_y1": 201.82, "r_x2": 448.17, "r_y2": 192.49, "r_x3": 435.47, "r_y3": 192.49, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38, "r_y0": 214.15, "r_x1": 448.08, "r_y1": 214.15, "r_x2": 448.08, "r_y2": 204.83, "r_x3": 435.38, "r_y3": 204.83, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.56, "r_x1": 448.3, "r_y1": 226.56, "r_x2": 448.3, "r_y2": 217.23, "r_x3": 435.6, "r_y3": 217.23, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.15, "r_y0": 214.56, "r_x1": 381.32, "r_y1": 214.56, "r_x2": 381.32, "r_y2": 205.23, "r_x3": 374.15, "r_y3": 205.23, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.04, "r_y0": 226.47, "r_x1": 381.22, "r_y1": 226.47, "r_x2": 381.22, "r_y2": 217.15, "r_x3": 374.04, "r_y3": 217.15, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34, "r_y0": 190.26, "r_x1": 381.52, "r_y1": 190.26, "r_x2": 381.52, "r_y2": 180.93, "r_x3": 374.34, "r_y3": 180.93, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76, "r_y0": 177.9, "r_x1": 393.29, "r_y1": 177.9, "r_x2": 393.29, "r_y2": 168.58, "r_x3": 387.76, "r_y3": 168.58, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86, "r_y0": 177.38, "r_x1": 417.39, "r_y1": 177.38, "r_x2": 417.39, "r_y2": 168.06, "r_x3": 411.86, "r_y3": 168.06, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.34, "r_y0": 177.26, "r_x1": 428.86, "r_y1": 177.26, "r_x2": 428.86, "r_y2": 167.93, "r_x3": 423.34, "r_y3": 167.93, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.14, "r_y0": 190.11, "r_x1": 393.76, "r_y1": 190.11, "r_x2": 393.76, "r_y2": 180.79, "r_x3": 387.14, "r_y3": 180.79, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.26, "r_y0": 253.83, "r_x1": 289.43, "r_y1": 253.83, "r_x2": 289.43, "r_y2": 244.51, "r_x3": 282.26, "r_y3": 244.51, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11, "r_y0": 266.17, "r_x1": 289.29, "r_y1": 266.17, "r_x2": 289.29, "r_y2": 256.85, "r_x3": 282.11, "r_y3": 256.85, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.41, "r_y0": 278.45, "r_x1": 289.58, "r_y1": 278.45, "r_x2": 289.58, "r_y2": 269.13, "r_x3": 282.41, "r_y3": 269.13, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.53, "r_y0": 253.82, "r_x1": 301.05, "r_y1": 253.82, "r_x2": 301.05, "r_y2": 244.49, "r_x3": 295.53, "r_y3": 244.49, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.47, "r_y0": 253.9, "r_x1": 312.99, "r_y1": 253.9, "r_x2": 312.99, "r_y2": 244.57, "r_x3": 307.47, "r_y3": 244.57, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 253.76, "r_x1": 324.29, "r_y1": 253.76, "r_x2": 324.29, "r_y2": 244.44, "r_x3": 318.77, "r_y3": 244.44, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.02, "r_x1": 301.04, "r_y1": 266.02, "r_x2": 301.04, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.18, "r_y0": 266.02, "r_x1": 325.59, "r_y1": 266.02, "r_x2": 325.59, "r_y2": 256.7, "r_x3": 307.18, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.79, "r_y0": 278.58, "r_x1": 300.93, "r_y1": 278.58, "r_x2": 300.93, "r_y2": 269.25, "r_x3": 294.79, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06, "r_y0": 278.58, "r_x1": 325.48, "r_y1": 278.58, "r_x2": 325.48, "r_y2": 269.25, "r_x3": 307.06, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.94, "r_y0": 278.07, "r_x1": 203.11, "r_y1": 278.07, "r_x2": 203.11, "r_y2": 268.75, "r_x3": 195.94, "r_y3": 268.75, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.21, "r_y0": 278.05, "r_x1": 214.73, "r_y1": 278.05, "r_x2": 214.73, "r_y2": 268.73, "r_x3": 209.21, "r_y3": 268.73, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.15, "r_y0": 278.13, "r_x1": 226.67, "r_y1": 278.13, "r_x2": 226.67, "r_y2": 268.81, "r_x3": 221.15, "r_y3": 268.81, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.45, "r_y0": 278.0, "r_x1": 237.97, "r_y1": 278.0, "r_x2": 237.97, "r_y2": 268.68, "r_x3": 232.45, "r_y3": 268.68, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.22, "r_y0": 253.86, "r_x1": 203.39, "r_y1": 253.86, "r_x2": 203.39, "r_y2": 244.54, "r_x3": 196.22, "r_y3": 244.54, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32, "r_y0": 253.42, "r_x1": 257.5, "r_y1": 253.42, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.32, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17, "r_y0": 265.76, "r_x1": 257.35, "r_y1": 265.76, "r_x2": 257.35, "r_y2": 256.44, "r_x3": 250.17, "r_y3": 256.44, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47, "r_y0": 278.04, "r_x1": 257.65, "r_y1": 278.04, "r_x2": 257.65, "r_y2": 268.72, "r_x3": 250.47, "r_y3": 268.72, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 249.21, "r_x1": 337.22, "r_y1": 249.21, "r_x2": 337.22, "r_y2": 242.99, "r_x3": 334.51, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.94, "r_y0": 249.21, "r_x1": 391.49, "r_y1": 249.21, "r_x2": 391.49, "r_y2": 242.99, "r_x3": 339.94, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 259.15, "r_x1": 337.33, "r_y1": 259.15, "r_x2": 337.33, "r_y2": 252.93, "r_x3": 334.51, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15, "r_y0": 259.15, "r_x1": 421.99, "r_y1": 259.15, "r_x2": 421.99, "r_y2": 252.93, "r_x3": 340.15, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 269.08, "r_x1": 337.3, "r_y1": 269.08, "r_x2": 337.3, "r_y2": 262.87, "r_x3": 334.51, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 269.08, "r_x1": 415.34, "r_y1": 269.08, "r_x2": 415.34, "r_y2": 262.87, "r_x3": 340.09, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 279.02, "r_x1": 337.3, "r_y1": 279.02, "r_x2": 337.3, "r_y2": 272.81, "r_x3": 334.51, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 279.02, "r_x1": 426.6, "r_y1": 279.02, "r_x2": 426.6, "r_y2": 272.81, "r_x3": 340.09, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67, "r_y0": 250.26, "r_x1": 189.36, "r_y1": 250.26, "r_x2": 189.36, "r_y2": 244.04, "r_x3": 185.67, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.97, "r_y0": 274.56, "r_x1": 189.65, "r_y1": 274.56, "r_x2": 189.65, "r_y2": 268.35, "r_x3": 185.97, "r_y3": 268.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34, "r_y0": 249.84, "r_x1": 243.03, "r_y1": 249.84, "r_x2": 243.03, "r_y2": 243.63, "r_x3": 239.34, "r_y3": 243.63, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.33, "r_y0": 249.71, "r_x1": 275.01, "r_y1": 249.71, "r_x2": 275.01, "r_y2": 243.49, "r_x3": 271.33, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.82, "r_y0": 172.73, "r_x1": 233.5, "r_y1": 172.73, "r_x2": 233.5, "r_y2": 166.51, "r_x3": 229.82, "r_y3": 166.51, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24, "r_y0": 196.18, "r_x1": 260.93, "r_y1": 196.18, "r_x2": 260.93, "r_y2": 189.96, "r_x3": 257.24, "r_y3": 189.96, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.88, "r_y0": 184.19, "r_x1": 190.56, "r_y1": 184.19, "r_x2": 190.56, "r_y2": 177.98, "r_x3": 186.88, "r_y3": 177.98, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.49, "r_y0": 175.23, "r_x1": 200.17, "r_y1": 175.23, "r_x2": 200.17, "r_y2": 169.02, "r_x3": 196.49, "r_y3": 169.02, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 175.65, "r_x1": 175.73, "r_y1": 175.65, "r_x2": 175.73, "r_y2": 167.88, "r_x3": 169.75, "r_y3": 167.88, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 214.61, "r_x1": 175.73, "r_y1": 214.61, "r_x2": 175.73, "r_y2": 206.84, "r_x3": 169.75, "r_y3": 206.84, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29, "r_y0": 176.05, "r_x1": 280.27, "r_y1": 176.05, "r_x2": 280.27, "r_y2": 168.28, "r_x3": 274.29, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56, "r_y0": 176.05, "r_x1": 365.54, "r_y1": 176.05, "r_x2": 365.54, "r_y2": 168.28, "r_x3": 359.56, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 250.98, "r_x1": 175.27, "r_y1": 250.98, "r_x2": 175.27, "r_y2": 243.21, "r_x3": 169.75, "r_y3": 243.21, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 38, "label": "text", "bbox": { "l": 374.49, "t": 168.59, "r": 381.67, "b": 177.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49, "r_y0": 177.92, "r_x1": 381.67, "r_y1": 177.92, "r_x2": 381.67, "r_y2": 168.59, "r_x3": 374.49, "r_y3": 168.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 398.74, "t": 168.5, "r": 405.92, "b": 177.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74, "r_y0": 177.82, "r_x1": 405.92, "r_y1": 177.82, "r_x2": 405.92, "r_y2": 168.5, "r_x3": 398.74, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 373.77, "t": 192.93, "r": 380.94, "b": 202.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.77, "r_y0": 202.25, "r_x1": 380.94, "r_y1": 202.25, "r_x2": 380.94, "r_y2": 192.93, "r_x3": 373.77, "r_y3": 192.93, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 386.66, "t": 193.07, "r": 393.84, "b": 202.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66, "r_y0": 202.39, "r_x1": 393.84, "r_y1": 202.39, "r_x2": 393.84, "r_y2": 193.07, "r_x3": 386.66, "r_y3": 193.07, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 386.69, "t": 205.14, "r": 393.86, "b": 214.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.69, "r_y0": 214.46, "r_x1": 393.86, "r_y1": 214.46, "r_x2": 393.86, "r_y2": 205.14, "r_x3": 386.69, "r_y3": 205.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 398.66, "t": 180.73, "r": 405.83, "b": 190.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.66, "r_y0": 190.05, "r_x1": 405.83, "r_y1": 190.05, "r_x2": 405.83, "r_y2": 180.73, "r_x3": 398.66, "r_y3": 180.73, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 410.78, "t": 180.74, "r": 417.95, "b": 190.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.78, "r_y0": 190.06, "r_x1": 417.95, "r_y1": 190.06, "r_x2": 417.95, "r_y2": 180.74, "r_x3": 410.78, "r_y3": 180.74, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 422.91, "t": 180.65, "r": 430.08, "b": 189.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.91, "r_y0": 189.97, "r_x1": 430.08, "r_y1": 189.97, "r_x2": 430.08, "r_y2": 180.65, "r_x3": 422.91, "r_y3": 180.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 398.78, "t": 192.99, "r": 405.96, "b": 202.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 202.31, "r_x1": 405.96, "r_y1": 202.31, "r_x2": 405.96, "r_y2": 192.99, "r_x3": 398.78, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 410.9, "t": 192.99, "r": 418.08, "b": 202.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.32, "r_x1": 418.08, "r_y1": 202.32, "r_x2": 418.08, "r_y2": 192.99, "r_x3": 410.9, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 423.03, "t": 192.91, "r": 430.2, "b": 202.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 202.23, "r_x1": 430.2, "r_y1": 202.23, "r_x2": 430.2, "r_y2": 192.91, "r_x3": 423.03, "r_y3": 192.91, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 398.78, "t": 205.32, "r": 405.96, "b": 214.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 214.64, "r_x1": 405.96, "r_y1": 214.64, "r_x2": 405.96, "r_y2": 205.32, "r_x3": 398.78, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 410.9, "t": 205.32, "r": 418.08, "b": 214.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.64, "r_x1": 418.08, "r_y1": 214.64, "r_x2": 418.08, "r_y2": 205.32, "r_x3": 410.9, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 423.03, "t": 205.24, "r": 430.21, "b": 214.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 214.56, "r_x1": 430.21, "r_y1": 214.56, "r_x2": 430.21, "r_y2": 205.24, "r_x3": 423.03, "r_y3": 205.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 386.51, "t": 217.04, "r": 393.68, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.51, "r_y0": 226.36, "r_x1": 393.68, "r_y1": 226.36, "r_x2": 393.68, "r_y2": 217.04, "r_x3": 386.51, "r_y3": 217.04, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 398.6, "t": 217.22, "r": 405.78, "b": 226.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.54, "r_x1": 405.78, "r_y1": 226.54, "r_x2": 405.78, "r_y2": 217.22, "r_x3": 398.6, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 410.72, "t": 217.22, "r": 417.9, "b": 226.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72, "r_y0": 226.54, "r_x1": 417.9, "r_y1": 226.54, "r_x2": 417.9, "r_y2": 217.22, "r_x3": 410.72, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 422.85, "t": 217.14, "r": 430.02, "b": 226.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.85, "r_y0": 226.46, "r_x1": 430.02, "r_y1": 226.46, "r_x2": 430.02, "r_y2": 217.14, "r_x3": 422.85, "r_y3": 217.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 435.16, "t": 167.69, "r": 447.86, "b": 177.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16, "r_y0": 177.01, "r_x1": 447.86, "r_y1": 177.01, "r_x2": 447.86, "r_y2": 167.69, "r_x3": 435.16, "r_y3": 167.69, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 435.44, "t": 180.2, "r": 448.15, "b": 189.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44, "r_y0": 189.52, "r_x1": 448.15, "r_y1": 189.52, "r_x2": 448.15, "r_y2": 180.2, "r_x3": 435.44, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 435.47, "t": 192.49, "r": 448.17, "b": 201.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.47, "r_y0": 201.82, "r_x1": 448.17, "r_y1": 201.82, "r_x2": 448.17, "r_y2": 192.49, "r_x3": 435.47, "r_y3": 192.49, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 435.38, "t": 204.83, "r": 448.08, "b": 214.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38, "r_y0": 214.15, "r_x1": 448.08, "r_y1": 214.15, "r_x2": 448.08, "r_y2": 204.83, "r_x3": 435.38, "r_y3": 204.83, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 435.6, "t": 217.23, "r": 448.3, "b": 226.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.56, "r_x1": 448.3, "r_y1": 226.56, "r_x2": 448.3, "r_y2": 217.23, "r_x3": 435.6, "r_y3": 217.23, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 374.15, "t": 205.23, "r": 381.32, "b": 214.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.15, "r_y0": 214.56, "r_x1": 381.32, "r_y1": 214.56, "r_x2": 381.32, "r_y2": 205.23, "r_x3": 374.15, "r_y3": 205.23, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 374.04, "t": 217.15, "r": 381.22, "b": 226.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.04, "r_y0": 226.47, "r_x1": 381.22, "r_y1": 226.47, "r_x2": 381.22, "r_y2": 217.15, "r_x3": 374.04, "r_y3": 217.15, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 374.34, "t": 180.93, "r": 381.52, "b": 190.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34, "r_y0": 190.26, "r_x1": 381.52, "r_y1": 190.26, "r_x2": 381.52, "r_y2": 180.93, "r_x3": 374.34, "r_y3": 180.93, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 387.76, "t": 168.58, "r": 393.29, "b": 177.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76, "r_y0": 177.9, "r_x1": 393.29, "r_y1": 177.9, "r_x2": 393.29, "r_y2": 168.58, "r_x3": 387.76, "r_y3": 168.58, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 411.86, "t": 168.06, "r": 417.39, "b": 177.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86, "r_y0": 177.38, "r_x1": 417.39, "r_y1": 177.38, "r_x2": 417.39, "r_y2": 168.06, "r_x3": 411.86, "r_y3": 168.06, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 423.34, "t": 167.93, "r": 428.86, "b": 177.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.34, "r_y0": 177.26, "r_x1": 428.86, "r_y1": 177.26, "r_x2": 428.86, "r_y2": 167.93, "r_x3": 423.34, "r_y3": 167.93, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 387.14, "t": 180.79, "r": 393.76, "b": 190.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.14, "r_y0": 190.11, "r_x1": 393.76, "r_y1": 190.11, "r_x2": 393.76, "r_y2": 180.79, "r_x3": 387.14, "r_y3": 180.79, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 282.26, "t": 244.51, "r": 289.43, "b": 253.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.26, "r_y0": 253.83, "r_x1": 289.43, "r_y1": 253.83, "r_x2": 289.43, "r_y2": 244.51, "r_x3": 282.26, "r_y3": 244.51, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 282.11, "t": 256.85, "r": 289.29, "b": 266.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11, "r_y0": 266.17, "r_x1": 289.29, "r_y1": 266.17, "r_x2": 289.29, "r_y2": 256.85, "r_x3": 282.11, "r_y3": 256.85, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 282.41, "t": 269.13, "r": 289.58, "b": 278.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.41, "r_y0": 278.45, "r_x1": 289.58, "r_y1": 278.45, "r_x2": 289.58, "r_y2": 269.13, "r_x3": 282.41, "r_y3": 269.13, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 295.53, "t": 244.49, "r": 301.05, "b": 253.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.53, "r_y0": 253.82, "r_x1": 301.05, "r_y1": 253.82, "r_x2": 301.05, "r_y2": 244.49, "r_x3": 295.53, "r_y3": 244.49, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 307.47, "t": 244.57, "r": 312.99, "b": 253.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.47, "r_y0": 253.9, "r_x1": 312.99, "r_y1": 253.9, "r_x2": 312.99, "r_y2": 244.57, "r_x3": 307.47, "r_y3": 244.57, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 318.77, "t": 244.44, "r": 324.29, "b": 253.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 253.76, "r_x1": 324.29, "r_y1": 253.76, "r_x2": 324.29, "r_y2": 244.44, "r_x3": 318.77, "r_y3": 244.44, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 294.9, "t": 256.7, "r": 301.04, "b": 266.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.02, "r_x1": 301.04, "r_y1": 266.02, "r_x2": 301.04, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 307.18, "t": 256.7, "r": 325.59, "b": 266.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.18, "r_y0": 266.02, "r_x1": 325.59, "r_y1": 266.02, "r_x2": 325.59, "r_y2": 256.7, "r_x3": 307.18, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 294.79, "t": 269.25, "r": 300.93, "b": 278.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.79, "r_y0": 278.58, "r_x1": 300.93, "r_y1": 278.58, "r_x2": 300.93, "r_y2": 269.25, "r_x3": 294.79, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 307.06, "t": 269.25, "r": 325.48, "b": 278.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06, "r_y0": 278.58, "r_x1": 325.48, "r_y1": 278.58, "r_x2": 325.48, "r_y2": 269.25, "r_x3": 307.06, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 195.94, "t": 268.75, "r": 203.11, "b": 278.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.94, "r_y0": 278.07, "r_x1": 203.11, "r_y1": 278.07, "r_x2": 203.11, "r_y2": 268.75, "r_x3": 195.94, "r_y3": 268.75, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 209.21, "t": 268.73, "r": 214.73, "b": 278.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.21, "r_y0": 278.05, "r_x1": 214.73, "r_y1": 278.05, "r_x2": 214.73, "r_y2": 268.73, "r_x3": 209.21, "r_y3": 268.73, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 221.15, "t": 268.81, "r": 226.67, "b": 278.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.15, "r_y0": 278.13, "r_x1": 226.67, "r_y1": 278.13, "r_x2": 226.67, "r_y2": 268.81, "r_x3": 221.15, "r_y3": 268.81, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.45, "t": 268.68, "r": 237.97, "b": 278.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.45, "r_y0": 278.0, "r_x1": 237.97, "r_y1": 278.0, "r_x2": 237.97, "r_y2": 268.68, "r_x3": 232.45, "r_y3": 268.68, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 196.22, "t": 244.54, "r": 203.39, "b": 253.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.22, "r_y0": 253.86, "r_x1": 203.39, "r_y1": 253.86, "r_x2": 203.39, "r_y2": 244.54, "r_x3": 196.22, "r_y3": 244.54, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 250.32, "t": 244.1, "r": 257.5, "b": 253.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32, "r_y0": 253.42, "r_x1": 257.5, "r_y1": 253.42, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.32, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 250.17, "t": 256.44, "r": 257.35, "b": 265.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17, "r_y0": 265.76, "r_x1": 257.35, "r_y1": 265.76, "r_x2": 257.35, "r_y2": 256.44, "r_x3": 250.17, "r_y3": 256.44, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 250.47, "t": 268.72, "r": 257.65, "b": 278.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47, "r_y0": 278.04, "r_x1": 257.65, "r_y1": 278.04, "r_x2": 257.65, "r_y2": 268.72, "r_x3": 250.47, "r_y3": 268.72, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 334.51, "t": 242.99, "r": 337.22, "b": 249.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 249.21, "r_x1": 337.22, "r_y1": 249.21, "r_x2": 337.22, "r_y2": 242.99, "r_x3": 334.51, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 339.94, "t": 242.99, "r": 391.49, "b": 249.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.94, "r_y0": 249.21, "r_x1": 391.49, "r_y1": 249.21, "r_x2": 391.49, "r_y2": 242.99, "r_x3": 339.94, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 334.51, "t": 252.93, "r": 337.33, "b": 259.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 259.15, "r_x1": 337.33, "r_y1": 259.15, "r_x2": 337.33, "r_y2": 252.93, "r_x3": 334.51, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 340.15, "t": 252.93, "r": 421.99, "b": 259.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15, "r_y0": 259.15, "r_x1": 421.99, "r_y1": 259.15, "r_x2": 421.99, "r_y2": 252.93, "r_x3": 340.15, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 334.51, "t": 262.87, "r": 337.3, "b": 269.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 269.08, "r_x1": 337.3, "r_y1": 269.08, "r_x2": 337.3, "r_y2": 262.87, "r_x3": 334.51, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 340.09, "t": 262.87, "r": 415.34, "b": 269.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 269.08, "r_x1": 415.34, "r_y1": 269.08, "r_x2": 415.34, "r_y2": 262.87, "r_x3": 340.09, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 334.51, "t": 272.81, "r": 426.6, "b": 279.02, "coord_origin": "TOPLEFT" }, "confidence": 0.525, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 279.02, "r_x1": 337.3, "r_y1": 279.02, "r_x2": 337.3, "r_y2": 272.81, "r_x3": 334.51, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 279.02, "r_x1": 426.6, "r_y1": 279.02, "r_x2": 426.6, "r_y2": 272.81, "r_x3": 340.09, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 185.67, "t": 244.04, "r": 189.36, "b": 250.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67, "r_y0": 250.26, "r_x1": 189.36, "r_y1": 250.26, "r_x2": 189.36, "r_y2": 244.04, "r_x3": 185.67, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 185.97, "t": 268.35, "r": 189.65, "b": 274.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.97, "r_y0": 274.56, "r_x1": 189.65, "r_y1": 274.56, "r_x2": 189.65, "r_y2": 268.35, "r_x3": 185.97, "r_y3": 268.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 239.34, "t": 243.63, "r": 243.03, "b": 249.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34, "r_y0": 249.84, "r_x1": 243.03, "r_y1": 249.84, "r_x2": 243.03, "r_y2": 243.63, "r_x3": 239.34, "r_y3": 243.63, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 271.33, "t": 243.49, "r": 275.01, "b": 249.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.33, "r_y0": 249.71, "r_x1": 275.01, "r_y1": 249.71, "r_x2": 275.01, "r_y2": 243.49, "r_x3": 271.33, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 229.82, "t": 166.51, "r": 233.5, "b": 172.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.82, "r_y0": 172.73, "r_x1": 233.5, "r_y1": 172.73, "r_x2": 233.5, "r_y2": 166.51, "r_x3": 229.82, "r_y3": 166.51, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 257.24, "t": 189.96, "r": 260.93, "b": 196.18, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24, "r_y0": 196.18, "r_x1": 260.93, "r_y1": 196.18, "r_x2": 260.93, "r_y2": 189.96, "r_x3": 257.24, "r_y3": 189.96, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 186.88, "t": 177.98, "r": 190.56, "b": 184.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.88, "r_y0": 184.19, "r_x1": 190.56, "r_y1": 184.19, "r_x2": 190.56, "r_y2": 177.98, "r_x3": 186.88, "r_y3": 177.98, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 196.49, "t": 169.02, "r": 200.17, "b": 175.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.49, "r_y0": 175.23, "r_x1": 200.17, "r_y1": 175.23, "r_x2": 200.17, "r_y2": 169.02, "r_x3": 196.49, "r_y3": 169.02, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 169.75, "t": 167.88, "r": 175.73, "b": 175.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 175.65, "r_x1": 175.73, "r_y1": 175.65, "r_x2": 175.73, "r_y2": 167.88, "r_x3": 169.75, "r_y3": 167.88, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 169.75, "t": 206.84, "r": 175.73, "b": 214.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 214.61, "r_x1": 175.73, "r_y1": 214.61, "r_x2": 175.73, "r_y2": 206.84, "r_x3": 169.75, "r_y3": 206.84, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 274.29, "t": 168.28, "r": 280.27, "b": 176.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29, "r_y0": 176.05, "r_x1": 280.27, "r_y1": 176.05, "r_x2": 280.27, "r_y2": 168.28, "r_x3": 274.29, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 359.56, "t": 168.28, "r": 365.54, "b": 176.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56, "r_y0": 176.05, "r_x1": 365.54, "r_y1": 176.05, "r_x2": 365.54, "r_y2": 168.28, "r_x3": 359.56, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 169.75, "t": 243.21, "r": 175.27, "b": 250.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 250.98, "r_x1": 175.27, "r_y1": 250.98, "r_x2": 175.27, "r_y2": 243.21, "r_x3": 169.75, "r_y3": 243.21, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 9, "label": "section_header", "bbox": { "l": 134.76, "t": 305.3, "r": 246.65, "b": 314.1, "coord_origin": "TOPLEFT" }, "confidence": 0.923, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 314.1, "r_x1": 149.4, "r_y1": 314.1, "r_x2": 149.4, "r_y2": 305.3, "r_x3": 134.76, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 314.1, "r_x1": 246.65, "r_y1": 314.1, "r_x2": 246.65, "r_y2": 305.3, "r_x3": 160.86, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "text", "bbox": { "l": 134.76, "t": 325.25, "r": 363.8, "b": 334.04, "coord_origin": "TOPLEFT" }, "confidence": 0.917, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 334.04, "r_x1": 363.8, "r_y1": 334.04, "r_x2": 363.8, "r_y2": 325.25, "r_x3": 134.76, "r_y3": 325.25, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 138.97, "t": 347.17, "r": 480.59, "b": 367.93, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 355.98, "r_x1": 146.72, "r_y1": 355.98, "r_x2": 146.72, "r_y2": 347.18, "r_x3": 138.97, "r_y3": 347.18, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 355.98, "r_x1": 257.38, "r_y1": 355.98, "r_x2": 257.38, "r_y2": 347.17, "r_x3": 151.7, "r_y3": 347.17, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.38, "r_y0": 355.98, "r_x1": 480.59, "r_y1": 355.98, "r_x2": 480.59, "r_y2": 347.18, "r_x3": 257.38, "r_y3": 347.18, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 367.93, "r_x1": 283.59, "r_y1": 367.93, "r_x2": 283.59, "r_y2": 359.14, "r_x3": 151.7, "r_y3": 359.14, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 138.97, "t": 371.08, "r": 480.59, "b": 391.85, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 379.89, "r_x1": 146.72, "r_y1": 379.89, "r_x2": 146.72, "r_y2": 371.09, "r_x3": 138.97, "r_y3": 371.09, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 379.89, "r_x1": 252.11, "r_y1": 379.89, "r_x2": 252.11, "r_y2": 371.08, "r_x3": 151.7, "r_y3": 371.08, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.11, "r_y0": 379.89, "r_x1": 480.59, "r_y1": 379.89, "r_x2": 480.59, "r_y2": 371.09, "r_x3": 252.11, "r_y3": 371.09, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 391.85, "r_x1": 284.84, "r_y1": 391.85, "r_x2": 284.84, "r_y2": 383.05, "r_x3": 151.7, "r_y3": 383.05, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "section_header", "bbox": { "l": 138.97, "t": 395.0, "r": 226.07, "b": 403.8, "coord_origin": "TOPLEFT" }, "confidence": 0.651, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 403.8, "r_x1": 146.72, "r_y1": 403.8, "r_x2": 146.72, "r_y2": 395.01, "r_x3": 138.97, "r_y3": 395.01, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 403.8, "r_x1": 223.3, "r_y1": 403.8, "r_x2": 223.3, "r_y2": 395.0, "r_x3": 151.7, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.31, "r_y0": 403.8, "r_x1": 226.07, "r_y1": 403.8, "r_x2": 226.07, "r_y2": 395.01, "r_x3": 223.31, "r_y3": 395.01, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "list_item", "bbox": { "l": 151.7, "t": 406.97, "r": 480.59, "b": 439.67, "coord_origin": "TOPLEFT" }, "confidence": 0.725, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 415.76, "r_x1": 480.59, "r_y1": 415.76, "r_x2": 480.59, "r_y2": 406.97, "r_x3": 151.7, "r_y3": 406.97, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 427.72, "r_x1": 480.59, "r_y1": 427.72, "r_x2": 480.59, "r_y2": 418.92, "r_x3": 151.7, "r_y3": 418.92, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 439.67, "r_x1": 214.4, "r_y1": 439.67, "r_x2": 214.4, "r_y2": 430.88, "r_x3": 151.7, "r_y3": 430.88, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 138.97, "t": 442.83, "r": 474.59, "b": 451.63, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 451.63, "r_x1": 146.72, "r_y1": 451.63, "r_x2": 146.72, "r_y2": 442.84, "r_x3": 138.97, "r_y3": 442.84, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 451.63, "r_x1": 221.32, "r_y1": 451.63, "r_x2": 221.32, "r_y2": 442.83, "r_x3": 151.7, "r_y3": 442.83, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.33, "r_y0": 451.63, "r_x1": 474.59, "r_y1": 451.63, "r_x2": 474.59, "r_y2": 442.84, "r_x3": 221.33, "r_y3": 442.84, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 138.97, "t": 454.78, "r": 480.59, "b": 475.55, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 463.59, "r_x1": 146.72, "r_y1": 463.59, "r_x2": 146.72, "r_y2": 454.79, "r_x3": 138.97, "r_y3": 454.79, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 463.59, "r_x1": 240.72, "r_y1": 463.59, "r_x2": 240.72, "r_y2": 454.78, "r_x3": 151.7, "r_y3": 454.78, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.72, "r_y0": 463.59, "r_x1": 480.59, "r_y1": 463.59, "r_x2": 480.59, "r_y2": 454.79, "r_x3": 240.72, "r_y3": 454.79, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 475.55, "r_x1": 186.01, "r_y1": 475.55, "r_x2": 186.01, "r_y2": 466.75, "r_x3": 151.7, "r_y3": 466.75, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 138.97, "t": 478.7, "r": 480.59, "b": 499.46, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 487.5, "r_x1": 146.72, "r_y1": 487.5, "r_x2": 146.72, "r_y2": 478.71, "r_x3": 138.97, "r_y3": 478.71, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 487.5, "r_x1": 235.16, "r_y1": 487.5, "r_x2": 235.16, "r_y2": 478.7, "r_x3": 151.7, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.16, "r_y0": 487.5, "r_x1": 480.59, "r_y1": 487.5, "r_x2": 480.59, "r_y2": 478.71, "r_x3": 235.16, "r_y3": 478.71, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 499.46, "r_x1": 448.04, "r_y1": 499.46, "r_x2": 448.04, "r_y2": 490.66, "r_x3": 151.7, "r_y3": 490.66, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 512.59, "r": 480.6, "b": 640.94, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 521.39, "r_x1": 480.6, "r_y1": 521.39, "r_x2": 480.6, "r_y2": 512.59, "r_x3": 149.71, "r_y3": 512.59, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.34, "r_x1": 480.59, "r_y1": 533.34, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.5, "r_x3": 134.76, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.41, "r_x3": 134.76, "r_y3": 560.41, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.32, "r_x3": 134.76, "r_y3": 584.32, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.23, "r_x3": 134.76, "r_y3": 608.23, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.76, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 311.2, "r_y1": 640.94, "r_x2": 311.2, "r_y2": 632.14, "r_x3": 134.76, "r_y3": 632.14, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 644.1, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 149.71, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.875, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" }, { "label": "caption", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 134.76, "t": 125.8, "r": 480.59, "b": 155.85, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 133.73, "r_x1": 162.64, "r_y1": 133.73, "r_x2": 162.64, "r_y2": 125.8, "r_x3": 134.76, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.28, "r_y0": 133.93, "r_x1": 480.59, "r_y1": 133.93, "r_x2": 480.59, "r_y2": 125.86, "r_x3": 166.28, "r_y3": 125.86, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 144.89, "r_x1": 480.59, "r_y1": 144.89, "r_x2": 480.59, "r_y2": 136.82, "r_x3": 134.76, "r_y3": 136.82, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.85, "r_x1": 306.12, "r_y1": 155.85, "r_x2": 306.12, "r_y2": 147.78, "r_x3": 134.76, "r_y3": 147.78, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 3. OTSL description of table structure: A - table example; B - graphical representation of table structure; C - mapping structure on a grid; D - OTSL structure encoding; E - explanation on cell encoding" }, { "label": "picture", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 164.65, "t": 163.8, "r": 449.55, "b": 280.34, "coord_origin": "TOPLEFT" }, "confidence": 0.787, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49, "r_y0": 177.92, "r_x1": 381.67, "r_y1": 177.92, "r_x2": 381.67, "r_y2": 168.59, "r_x3": 374.49, "r_y3": 168.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74, "r_y0": 177.82, "r_x1": 405.92, "r_y1": 177.82, "r_x2": 405.92, "r_y2": 168.5, "r_x3": 398.74, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.77, "r_y0": 202.25, "r_x1": 380.94, "r_y1": 202.25, "r_x2": 380.94, "r_y2": 192.93, "r_x3": 373.77, "r_y3": 192.93, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66, "r_y0": 202.39, "r_x1": 393.84, "r_y1": 202.39, "r_x2": 393.84, "r_y2": 193.07, "r_x3": 386.66, "r_y3": 193.07, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.69, "r_y0": 214.46, "r_x1": 393.86, "r_y1": 214.46, "r_x2": 393.86, "r_y2": 205.14, "r_x3": 386.69, "r_y3": 205.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.66, "r_y0": 190.05, "r_x1": 405.83, "r_y1": 190.05, "r_x2": 405.83, "r_y2": 180.73, "r_x3": 398.66, "r_y3": 180.73, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.78, "r_y0": 190.06, "r_x1": 417.95, "r_y1": 190.06, "r_x2": 417.95, "r_y2": 180.74, "r_x3": 410.78, "r_y3": 180.74, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.91, "r_y0": 189.97, "r_x1": 430.08, "r_y1": 189.97, "r_x2": 430.08, "r_y2": 180.65, "r_x3": 422.91, "r_y3": 180.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 202.31, "r_x1": 405.96, "r_y1": 202.31, "r_x2": 405.96, "r_y2": 192.99, "r_x3": 398.78, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.32, "r_x1": 418.08, "r_y1": 202.32, "r_x2": 418.08, "r_y2": 192.99, "r_x3": 410.9, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 202.23, "r_x1": 430.2, "r_y1": 202.23, "r_x2": 430.2, "r_y2": 192.91, "r_x3": 423.03, "r_y3": 192.91, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 214.64, "r_x1": 405.96, "r_y1": 214.64, "r_x2": 405.96, "r_y2": 205.32, "r_x3": 398.78, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.64, "r_x1": 418.08, "r_y1": 214.64, "r_x2": 418.08, "r_y2": 205.32, "r_x3": 410.9, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 214.56, "r_x1": 430.21, "r_y1": 214.56, "r_x2": 430.21, "r_y2": 205.24, "r_x3": 423.03, "r_y3": 205.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.51, "r_y0": 226.36, "r_x1": 393.68, "r_y1": 226.36, "r_x2": 393.68, "r_y2": 217.04, "r_x3": 386.51, "r_y3": 217.04, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.54, "r_x1": 405.78, "r_y1": 226.54, "r_x2": 405.78, "r_y2": 217.22, "r_x3": 398.6, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72, "r_y0": 226.54, "r_x1": 417.9, "r_y1": 226.54, "r_x2": 417.9, "r_y2": 217.22, "r_x3": 410.72, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.85, "r_y0": 226.46, "r_x1": 430.02, "r_y1": 226.46, "r_x2": 430.02, "r_y2": 217.14, "r_x3": 422.85, "r_y3": 217.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16, "r_y0": 177.01, "r_x1": 447.86, "r_y1": 177.01, "r_x2": 447.86, "r_y2": 167.69, "r_x3": 435.16, "r_y3": 167.69, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44, "r_y0": 189.52, "r_x1": 448.15, "r_y1": 189.52, "r_x2": 448.15, "r_y2": 180.2, "r_x3": 435.44, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.47, "r_y0": 201.82, "r_x1": 448.17, "r_y1": 201.82, "r_x2": 448.17, "r_y2": 192.49, "r_x3": 435.47, "r_y3": 192.49, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38, "r_y0": 214.15, "r_x1": 448.08, "r_y1": 214.15, "r_x2": 448.08, "r_y2": 204.83, "r_x3": 435.38, "r_y3": 204.83, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.56, "r_x1": 448.3, "r_y1": 226.56, "r_x2": 448.3, "r_y2": 217.23, "r_x3": 435.6, "r_y3": 217.23, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.15, "r_y0": 214.56, "r_x1": 381.32, "r_y1": 214.56, "r_x2": 381.32, "r_y2": 205.23, "r_x3": 374.15, "r_y3": 205.23, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.04, "r_y0": 226.47, "r_x1": 381.22, "r_y1": 226.47, "r_x2": 381.22, "r_y2": 217.15, "r_x3": 374.04, "r_y3": 217.15, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34, "r_y0": 190.26, "r_x1": 381.52, "r_y1": 190.26, "r_x2": 381.52, "r_y2": 180.93, "r_x3": 374.34, "r_y3": 180.93, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76, "r_y0": 177.9, "r_x1": 393.29, "r_y1": 177.9, "r_x2": 393.29, "r_y2": 168.58, "r_x3": 387.76, "r_y3": 168.58, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86, "r_y0": 177.38, "r_x1": 417.39, "r_y1": 177.38, "r_x2": 417.39, "r_y2": 168.06, "r_x3": 411.86, "r_y3": 168.06, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.34, "r_y0": 177.26, "r_x1": 428.86, "r_y1": 177.26, "r_x2": 428.86, "r_y2": 167.93, "r_x3": 423.34, "r_y3": 167.93, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.14, "r_y0": 190.11, "r_x1": 393.76, "r_y1": 190.11, "r_x2": 393.76, "r_y2": 180.79, "r_x3": 387.14, "r_y3": 180.79, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.26, "r_y0": 253.83, "r_x1": 289.43, "r_y1": 253.83, "r_x2": 289.43, "r_y2": 244.51, "r_x3": 282.26, "r_y3": 244.51, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11, "r_y0": 266.17, "r_x1": 289.29, "r_y1": 266.17, "r_x2": 289.29, "r_y2": 256.85, "r_x3": 282.11, "r_y3": 256.85, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.41, "r_y0": 278.45, "r_x1": 289.58, "r_y1": 278.45, "r_x2": 289.58, "r_y2": 269.13, "r_x3": 282.41, "r_y3": 269.13, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.53, "r_y0": 253.82, "r_x1": 301.05, "r_y1": 253.82, "r_x2": 301.05, "r_y2": 244.49, "r_x3": 295.53, "r_y3": 244.49, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.47, "r_y0": 253.9, "r_x1": 312.99, "r_y1": 253.9, "r_x2": 312.99, "r_y2": 244.57, "r_x3": 307.47, "r_y3": 244.57, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 253.76, "r_x1": 324.29, "r_y1": 253.76, "r_x2": 324.29, "r_y2": 244.44, "r_x3": 318.77, "r_y3": 244.44, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.02, "r_x1": 301.04, "r_y1": 266.02, "r_x2": 301.04, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.18, "r_y0": 266.02, "r_x1": 325.59, "r_y1": 266.02, "r_x2": 325.59, "r_y2": 256.7, "r_x3": 307.18, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.79, "r_y0": 278.58, "r_x1": 300.93, "r_y1": 278.58, "r_x2": 300.93, "r_y2": 269.25, "r_x3": 294.79, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06, "r_y0": 278.58, "r_x1": 325.48, "r_y1": 278.58, "r_x2": 325.48, "r_y2": 269.25, "r_x3": 307.06, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.94, "r_y0": 278.07, "r_x1": 203.11, "r_y1": 278.07, "r_x2": 203.11, "r_y2": 268.75, "r_x3": 195.94, "r_y3": 268.75, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.21, "r_y0": 278.05, "r_x1": 214.73, "r_y1": 278.05, "r_x2": 214.73, "r_y2": 268.73, "r_x3": 209.21, "r_y3": 268.73, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.15, "r_y0": 278.13, "r_x1": 226.67, "r_y1": 278.13, "r_x2": 226.67, "r_y2": 268.81, "r_x3": 221.15, "r_y3": 268.81, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.45, "r_y0": 278.0, "r_x1": 237.97, "r_y1": 278.0, "r_x2": 237.97, "r_y2": 268.68, "r_x3": 232.45, "r_y3": 268.68, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.22, "r_y0": 253.86, "r_x1": 203.39, "r_y1": 253.86, "r_x2": 203.39, "r_y2": 244.54, "r_x3": 196.22, "r_y3": 244.54, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32, "r_y0": 253.42, "r_x1": 257.5, "r_y1": 253.42, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.32, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17, "r_y0": 265.76, "r_x1": 257.35, "r_y1": 265.76, "r_x2": 257.35, "r_y2": 256.44, "r_x3": 250.17, "r_y3": 256.44, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47, "r_y0": 278.04, "r_x1": 257.65, "r_y1": 278.04, "r_x2": 257.65, "r_y2": 268.72, "r_x3": 250.47, "r_y3": 268.72, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 249.21, "r_x1": 337.22, "r_y1": 249.21, "r_x2": 337.22, "r_y2": 242.99, "r_x3": 334.51, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.94, "r_y0": 249.21, "r_x1": 391.49, "r_y1": 249.21, "r_x2": 391.49, "r_y2": 242.99, "r_x3": 339.94, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 259.15, "r_x1": 337.33, "r_y1": 259.15, "r_x2": 337.33, "r_y2": 252.93, "r_x3": 334.51, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15, "r_y0": 259.15, "r_x1": 421.99, "r_y1": 259.15, "r_x2": 421.99, "r_y2": 252.93, "r_x3": 340.15, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 269.08, "r_x1": 337.3, "r_y1": 269.08, "r_x2": 337.3, "r_y2": 262.87, "r_x3": 334.51, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 269.08, "r_x1": 415.34, "r_y1": 269.08, "r_x2": 415.34, "r_y2": 262.87, "r_x3": 340.09, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 279.02, "r_x1": 337.3, "r_y1": 279.02, "r_x2": 337.3, "r_y2": 272.81, "r_x3": 334.51, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 279.02, "r_x1": 426.6, "r_y1": 279.02, "r_x2": 426.6, "r_y2": 272.81, "r_x3": 340.09, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67, "r_y0": 250.26, "r_x1": 189.36, "r_y1": 250.26, "r_x2": 189.36, "r_y2": 244.04, "r_x3": 185.67, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.97, "r_y0": 274.56, "r_x1": 189.65, "r_y1": 274.56, "r_x2": 189.65, "r_y2": 268.35, "r_x3": 185.97, "r_y3": 268.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34, "r_y0": 249.84, "r_x1": 243.03, "r_y1": 249.84, "r_x2": 243.03, "r_y2": 243.63, "r_x3": 239.34, "r_y3": 243.63, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.33, "r_y0": 249.71, "r_x1": 275.01, "r_y1": 249.71, "r_x2": 275.01, "r_y2": 243.49, "r_x3": 271.33, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.82, "r_y0": 172.73, "r_x1": 233.5, "r_y1": 172.73, "r_x2": 233.5, "r_y2": 166.51, "r_x3": 229.82, "r_y3": 166.51, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24, "r_y0": 196.18, "r_x1": 260.93, "r_y1": 196.18, "r_x2": 260.93, "r_y2": 189.96, "r_x3": 257.24, "r_y3": 189.96, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.88, "r_y0": 184.19, "r_x1": 190.56, "r_y1": 184.19, "r_x2": 190.56, "r_y2": 177.98, "r_x3": 186.88, "r_y3": 177.98, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.49, "r_y0": 175.23, "r_x1": 200.17, "r_y1": 175.23, "r_x2": 200.17, "r_y2": 169.02, "r_x3": 196.49, "r_y3": 169.02, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 175.65, "r_x1": 175.73, "r_y1": 175.65, "r_x2": 175.73, "r_y2": 167.88, "r_x3": 169.75, "r_y3": 167.88, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 214.61, "r_x1": 175.73, "r_y1": 214.61, "r_x2": 175.73, "r_y2": 206.84, "r_x3": 169.75, "r_y3": 206.84, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29, "r_y0": 176.05, "r_x1": 280.27, "r_y1": 176.05, "r_x2": 280.27, "r_y2": 168.28, "r_x3": 274.29, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56, "r_y0": 176.05, "r_x1": 365.54, "r_y1": 176.05, "r_x2": 365.54, "r_y2": 168.28, "r_x3": 359.56, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 250.98, "r_x1": 175.27, "r_y1": 250.98, "r_x2": 175.27, "r_y2": 243.21, "r_x3": 169.75, "r_y3": 243.21, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 38, "label": "text", "bbox": { "l": 374.49, "t": 168.59, "r": 381.67, "b": 177.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49, "r_y0": 177.92, "r_x1": 381.67, "r_y1": 177.92, "r_x2": 381.67, "r_y2": 168.59, "r_x3": 374.49, "r_y3": 168.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 398.74, "t": 168.5, "r": 405.92, "b": 177.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74, "r_y0": 177.82, "r_x1": 405.92, "r_y1": 177.82, "r_x2": 405.92, "r_y2": 168.5, "r_x3": 398.74, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 373.77, "t": 192.93, "r": 380.94, "b": 202.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.77, "r_y0": 202.25, "r_x1": 380.94, "r_y1": 202.25, "r_x2": 380.94, "r_y2": 192.93, "r_x3": 373.77, "r_y3": 192.93, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 386.66, "t": 193.07, "r": 393.84, "b": 202.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66, "r_y0": 202.39, "r_x1": 393.84, "r_y1": 202.39, "r_x2": 393.84, "r_y2": 193.07, "r_x3": 386.66, "r_y3": 193.07, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 386.69, "t": 205.14, "r": 393.86, "b": 214.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.69, "r_y0": 214.46, "r_x1": 393.86, "r_y1": 214.46, "r_x2": 393.86, "r_y2": 205.14, "r_x3": 386.69, "r_y3": 205.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 398.66, "t": 180.73, "r": 405.83, "b": 190.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.66, "r_y0": 190.05, "r_x1": 405.83, "r_y1": 190.05, "r_x2": 405.83, "r_y2": 180.73, "r_x3": 398.66, "r_y3": 180.73, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 410.78, "t": 180.74, "r": 417.95, "b": 190.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.78, "r_y0": 190.06, "r_x1": 417.95, "r_y1": 190.06, "r_x2": 417.95, "r_y2": 180.74, "r_x3": 410.78, "r_y3": 180.74, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 422.91, "t": 180.65, "r": 430.08, "b": 189.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.91, "r_y0": 189.97, "r_x1": 430.08, "r_y1": 189.97, "r_x2": 430.08, "r_y2": 180.65, "r_x3": 422.91, "r_y3": 180.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 398.78, "t": 192.99, "r": 405.96, "b": 202.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 202.31, "r_x1": 405.96, "r_y1": 202.31, "r_x2": 405.96, "r_y2": 192.99, "r_x3": 398.78, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 410.9, "t": 192.99, "r": 418.08, "b": 202.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.32, "r_x1": 418.08, "r_y1": 202.32, "r_x2": 418.08, "r_y2": 192.99, "r_x3": 410.9, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 423.03, "t": 192.91, "r": 430.2, "b": 202.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 202.23, "r_x1": 430.2, "r_y1": 202.23, "r_x2": 430.2, "r_y2": 192.91, "r_x3": 423.03, "r_y3": 192.91, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 398.78, "t": 205.32, "r": 405.96, "b": 214.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 214.64, "r_x1": 405.96, "r_y1": 214.64, "r_x2": 405.96, "r_y2": 205.32, "r_x3": 398.78, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 410.9, "t": 205.32, "r": 418.08, "b": 214.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.64, "r_x1": 418.08, "r_y1": 214.64, "r_x2": 418.08, "r_y2": 205.32, "r_x3": 410.9, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 423.03, "t": 205.24, "r": 430.21, "b": 214.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 214.56, "r_x1": 430.21, "r_y1": 214.56, "r_x2": 430.21, "r_y2": 205.24, "r_x3": 423.03, "r_y3": 205.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 386.51, "t": 217.04, "r": 393.68, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.51, "r_y0": 226.36, "r_x1": 393.68, "r_y1": 226.36, "r_x2": 393.68, "r_y2": 217.04, "r_x3": 386.51, "r_y3": 217.04, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 398.6, "t": 217.22, "r": 405.78, "b": 226.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.54, "r_x1": 405.78, "r_y1": 226.54, "r_x2": 405.78, "r_y2": 217.22, "r_x3": 398.6, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 410.72, "t": 217.22, "r": 417.9, "b": 226.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72, "r_y0": 226.54, "r_x1": 417.9, "r_y1": 226.54, "r_x2": 417.9, "r_y2": 217.22, "r_x3": 410.72, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 422.85, "t": 217.14, "r": 430.02, "b": 226.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.85, "r_y0": 226.46, "r_x1": 430.02, "r_y1": 226.46, "r_x2": 430.02, "r_y2": 217.14, "r_x3": 422.85, "r_y3": 217.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 435.16, "t": 167.69, "r": 447.86, "b": 177.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16, "r_y0": 177.01, "r_x1": 447.86, "r_y1": 177.01, "r_x2": 447.86, "r_y2": 167.69, "r_x3": 435.16, "r_y3": 167.69, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 435.44, "t": 180.2, "r": 448.15, "b": 189.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44, "r_y0": 189.52, "r_x1": 448.15, "r_y1": 189.52, "r_x2": 448.15, "r_y2": 180.2, "r_x3": 435.44, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 435.47, "t": 192.49, "r": 448.17, "b": 201.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.47, "r_y0": 201.82, "r_x1": 448.17, "r_y1": 201.82, "r_x2": 448.17, "r_y2": 192.49, "r_x3": 435.47, "r_y3": 192.49, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 435.38, "t": 204.83, "r": 448.08, "b": 214.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38, "r_y0": 214.15, "r_x1": 448.08, "r_y1": 214.15, "r_x2": 448.08, "r_y2": 204.83, "r_x3": 435.38, "r_y3": 204.83, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 435.6, "t": 217.23, "r": 448.3, "b": 226.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.56, "r_x1": 448.3, "r_y1": 226.56, "r_x2": 448.3, "r_y2": 217.23, "r_x3": 435.6, "r_y3": 217.23, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 374.15, "t": 205.23, "r": 381.32, "b": 214.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.15, "r_y0": 214.56, "r_x1": 381.32, "r_y1": 214.56, "r_x2": 381.32, "r_y2": 205.23, "r_x3": 374.15, "r_y3": 205.23, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 374.04, "t": 217.15, "r": 381.22, "b": 226.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.04, "r_y0": 226.47, "r_x1": 381.22, "r_y1": 226.47, "r_x2": 381.22, "r_y2": 217.15, "r_x3": 374.04, "r_y3": 217.15, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 374.34, "t": 180.93, "r": 381.52, "b": 190.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34, "r_y0": 190.26, "r_x1": 381.52, "r_y1": 190.26, "r_x2": 381.52, "r_y2": 180.93, "r_x3": 374.34, "r_y3": 180.93, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 387.76, "t": 168.58, "r": 393.29, "b": 177.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76, "r_y0": 177.9, "r_x1": 393.29, "r_y1": 177.9, "r_x2": 393.29, "r_y2": 168.58, "r_x3": 387.76, "r_y3": 168.58, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 411.86, "t": 168.06, "r": 417.39, "b": 177.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86, "r_y0": 177.38, "r_x1": 417.39, "r_y1": 177.38, "r_x2": 417.39, "r_y2": 168.06, "r_x3": 411.86, "r_y3": 168.06, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 423.34, "t": 167.93, "r": 428.86, "b": 177.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.34, "r_y0": 177.26, "r_x1": 428.86, "r_y1": 177.26, "r_x2": 428.86, "r_y2": 167.93, "r_x3": 423.34, "r_y3": 167.93, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 387.14, "t": 180.79, "r": 393.76, "b": 190.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.14, "r_y0": 190.11, "r_x1": 393.76, "r_y1": 190.11, "r_x2": 393.76, "r_y2": 180.79, "r_x3": 387.14, "r_y3": 180.79, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 282.26, "t": 244.51, "r": 289.43, "b": 253.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.26, "r_y0": 253.83, "r_x1": 289.43, "r_y1": 253.83, "r_x2": 289.43, "r_y2": 244.51, "r_x3": 282.26, "r_y3": 244.51, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 282.11, "t": 256.85, "r": 289.29, "b": 266.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11, "r_y0": 266.17, "r_x1": 289.29, "r_y1": 266.17, "r_x2": 289.29, "r_y2": 256.85, "r_x3": 282.11, "r_y3": 256.85, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 282.41, "t": 269.13, "r": 289.58, "b": 278.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.41, "r_y0": 278.45, "r_x1": 289.58, "r_y1": 278.45, "r_x2": 289.58, "r_y2": 269.13, "r_x3": 282.41, "r_y3": 269.13, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 295.53, "t": 244.49, "r": 301.05, "b": 253.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.53, "r_y0": 253.82, "r_x1": 301.05, "r_y1": 253.82, "r_x2": 301.05, "r_y2": 244.49, "r_x3": 295.53, "r_y3": 244.49, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 307.47, "t": 244.57, "r": 312.99, "b": 253.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.47, "r_y0": 253.9, "r_x1": 312.99, "r_y1": 253.9, "r_x2": 312.99, "r_y2": 244.57, "r_x3": 307.47, "r_y3": 244.57, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 318.77, "t": 244.44, "r": 324.29, "b": 253.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 253.76, "r_x1": 324.29, "r_y1": 253.76, "r_x2": 324.29, "r_y2": 244.44, "r_x3": 318.77, "r_y3": 244.44, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 294.9, "t": 256.7, "r": 301.04, "b": 266.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.02, "r_x1": 301.04, "r_y1": 266.02, "r_x2": 301.04, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 307.18, "t": 256.7, "r": 325.59, "b": 266.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.18, "r_y0": 266.02, "r_x1": 325.59, "r_y1": 266.02, "r_x2": 325.59, "r_y2": 256.7, "r_x3": 307.18, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 294.79, "t": 269.25, "r": 300.93, "b": 278.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.79, "r_y0": 278.58, "r_x1": 300.93, "r_y1": 278.58, "r_x2": 300.93, "r_y2": 269.25, "r_x3": 294.79, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 307.06, "t": 269.25, "r": 325.48, "b": 278.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06, "r_y0": 278.58, "r_x1": 325.48, "r_y1": 278.58, "r_x2": 325.48, "r_y2": 269.25, "r_x3": 307.06, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 195.94, "t": 268.75, "r": 203.11, "b": 278.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.94, "r_y0": 278.07, "r_x1": 203.11, "r_y1": 278.07, "r_x2": 203.11, "r_y2": 268.75, "r_x3": 195.94, "r_y3": 268.75, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 209.21, "t": 268.73, "r": 214.73, "b": 278.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.21, "r_y0": 278.05, "r_x1": 214.73, "r_y1": 278.05, "r_x2": 214.73, "r_y2": 268.73, "r_x3": 209.21, "r_y3": 268.73, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 221.15, "t": 268.81, "r": 226.67, "b": 278.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.15, "r_y0": 278.13, "r_x1": 226.67, "r_y1": 278.13, "r_x2": 226.67, "r_y2": 268.81, "r_x3": 221.15, "r_y3": 268.81, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.45, "t": 268.68, "r": 237.97, "b": 278.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.45, "r_y0": 278.0, "r_x1": 237.97, "r_y1": 278.0, "r_x2": 237.97, "r_y2": 268.68, "r_x3": 232.45, "r_y3": 268.68, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 196.22, "t": 244.54, "r": 203.39, "b": 253.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.22, "r_y0": 253.86, "r_x1": 203.39, "r_y1": 253.86, "r_x2": 203.39, "r_y2": 244.54, "r_x3": 196.22, "r_y3": 244.54, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 250.32, "t": 244.1, "r": 257.5, "b": 253.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32, "r_y0": 253.42, "r_x1": 257.5, "r_y1": 253.42, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.32, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 250.17, "t": 256.44, "r": 257.35, "b": 265.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17, "r_y0": 265.76, "r_x1": 257.35, "r_y1": 265.76, "r_x2": 257.35, "r_y2": 256.44, "r_x3": 250.17, "r_y3": 256.44, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 250.47, "t": 268.72, "r": 257.65, "b": 278.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47, "r_y0": 278.04, "r_x1": 257.65, "r_y1": 278.04, "r_x2": 257.65, "r_y2": 268.72, "r_x3": 250.47, "r_y3": 268.72, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 334.51, "t": 242.99, "r": 337.22, "b": 249.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 249.21, "r_x1": 337.22, "r_y1": 249.21, "r_x2": 337.22, "r_y2": 242.99, "r_x3": 334.51, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 339.94, "t": 242.99, "r": 391.49, "b": 249.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.94, "r_y0": 249.21, "r_x1": 391.49, "r_y1": 249.21, "r_x2": 391.49, "r_y2": 242.99, "r_x3": 339.94, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 334.51, "t": 252.93, "r": 337.33, "b": 259.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 259.15, "r_x1": 337.33, "r_y1": 259.15, "r_x2": 337.33, "r_y2": 252.93, "r_x3": 334.51, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 340.15, "t": 252.93, "r": 421.99, "b": 259.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15, "r_y0": 259.15, "r_x1": 421.99, "r_y1": 259.15, "r_x2": 421.99, "r_y2": 252.93, "r_x3": 340.15, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 334.51, "t": 262.87, "r": 337.3, "b": 269.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 269.08, "r_x1": 337.3, "r_y1": 269.08, "r_x2": 337.3, "r_y2": 262.87, "r_x3": 334.51, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 340.09, "t": 262.87, "r": 415.34, "b": 269.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 269.08, "r_x1": 415.34, "r_y1": 269.08, "r_x2": 415.34, "r_y2": 262.87, "r_x3": 340.09, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 334.51, "t": 272.81, "r": 426.6, "b": 279.02, "coord_origin": "TOPLEFT" }, "confidence": 0.525, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 279.02, "r_x1": 337.3, "r_y1": 279.02, "r_x2": 337.3, "r_y2": 272.81, "r_x3": 334.51, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 279.02, "r_x1": 426.6, "r_y1": 279.02, "r_x2": 426.6, "r_y2": 272.81, "r_x3": 340.09, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 185.67, "t": 244.04, "r": 189.36, "b": 250.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67, "r_y0": 250.26, "r_x1": 189.36, "r_y1": 250.26, "r_x2": 189.36, "r_y2": 244.04, "r_x3": 185.67, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 185.97, "t": 268.35, "r": 189.65, "b": 274.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.97, "r_y0": 274.56, "r_x1": 189.65, "r_y1": 274.56, "r_x2": 189.65, "r_y2": 268.35, "r_x3": 185.97, "r_y3": 268.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 239.34, "t": 243.63, "r": 243.03, "b": 249.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34, "r_y0": 249.84, "r_x1": 243.03, "r_y1": 249.84, "r_x2": 243.03, "r_y2": 243.63, "r_x3": 239.34, "r_y3": 243.63, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 271.33, "t": 243.49, "r": 275.01, "b": 249.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.33, "r_y0": 249.71, "r_x1": 275.01, "r_y1": 249.71, "r_x2": 275.01, "r_y2": 243.49, "r_x3": 271.33, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 229.82, "t": 166.51, "r": 233.5, "b": 172.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.82, "r_y0": 172.73, "r_x1": 233.5, "r_y1": 172.73, "r_x2": 233.5, "r_y2": 166.51, "r_x3": 229.82, "r_y3": 166.51, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 257.24, "t": 189.96, "r": 260.93, "b": 196.18, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24, "r_y0": 196.18, "r_x1": 260.93, "r_y1": 196.18, "r_x2": 260.93, "r_y2": 189.96, "r_x3": 257.24, "r_y3": 189.96, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 186.88, "t": 177.98, "r": 190.56, "b": 184.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.88, "r_y0": 184.19, "r_x1": 190.56, "r_y1": 184.19, "r_x2": 190.56, "r_y2": 177.98, "r_x3": 186.88, "r_y3": 177.98, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 196.49, "t": 169.02, "r": 200.17, "b": 175.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.49, "r_y0": 175.23, "r_x1": 200.17, "r_y1": 175.23, "r_x2": 200.17, "r_y2": 169.02, "r_x3": 196.49, "r_y3": 169.02, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 169.75, "t": 167.88, "r": 175.73, "b": 175.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 175.65, "r_x1": 175.73, "r_y1": 175.65, "r_x2": 175.73, "r_y2": 167.88, "r_x3": 169.75, "r_y3": 167.88, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 169.75, "t": 206.84, "r": 175.73, "b": 214.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 214.61, "r_x1": 175.73, "r_y1": 214.61, "r_x2": 175.73, "r_y2": 206.84, "r_x3": 169.75, "r_y3": 206.84, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 274.29, "t": 168.28, "r": 280.27, "b": 176.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29, "r_y0": 176.05, "r_x1": 280.27, "r_y1": 176.05, "r_x2": 280.27, "r_y2": 168.28, "r_x3": 274.29, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 359.56, "t": 168.28, "r": 365.54, "b": 176.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56, "r_y0": 176.05, "r_x1": 365.54, "r_y1": 176.05, "r_x2": 365.54, "r_y2": 168.28, "r_x3": 359.56, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 169.75, "t": 243.21, "r": 175.27, "b": 250.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 250.98, "r_x1": 175.27, "r_y1": 250.98, "r_x2": 175.27, "r_y2": 243.21, "r_x3": 169.75, "r_y3": 243.21, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 134.76, "t": 305.3, "r": 246.65, "b": 314.1, "coord_origin": "TOPLEFT" }, "confidence": 0.923, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 314.1, "r_x1": 149.4, "r_y1": 314.1, "r_x2": 149.4, "r_y2": 305.3, "r_x3": 134.76, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 314.1, "r_x1": 246.65, "r_y1": 314.1, "r_x2": 246.65, "r_y2": 305.3, "r_x3": 160.86, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.2 Language Syntax" }, { "label": "text", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "text", "bbox": { "l": 134.76, "t": 325.25, "r": 363.8, "b": 334.04, "coord_origin": "TOPLEFT" }, "confidence": 0.917, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 334.04, "r_x1": 363.8, "r_y1": 334.04, "r_x2": 363.8, "r_y2": 325.25, "r_x3": 134.76, "r_y3": 325.25, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL representation follows these syntax rules:" }, { "label": "list_item", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 138.97, "t": 347.17, "r": 480.59, "b": 367.93, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 355.98, "r_x1": 146.72, "r_y1": 355.98, "r_x2": 146.72, "r_y2": 347.18, "r_x3": 138.97, "r_y3": 347.18, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 355.98, "r_x1": 257.38, "r_y1": 355.98, "r_x2": 257.38, "r_y2": 347.17, "r_x3": 151.7, "r_y3": 347.17, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.38, "r_y0": 355.98, "r_x1": 480.59, "r_y1": 355.98, "r_x2": 480.59, "r_y2": 347.18, "r_x3": 257.38, "r_y3": 347.18, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 367.93, "r_x1": 283.59, "r_y1": 367.93, "r_x2": 283.59, "r_y2": 359.14, "r_x3": 151.7, "r_y3": 359.14, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Left-looking cell rule : The left neighbour of an \"L\" cell must be either another \"L\" cell or a \"C\" cell." }, { "label": "list_item", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 138.97, "t": 371.08, "r": 480.59, "b": 391.85, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 379.89, "r_x1": 146.72, "r_y1": 379.89, "r_x2": 146.72, "r_y2": 371.09, "r_x3": 138.97, "r_y3": 371.09, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 379.89, "r_x1": 252.11, "r_y1": 379.89, "r_x2": 252.11, "r_y2": 371.08, "r_x3": 151.7, "r_y3": 371.08, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.11, "r_y0": 379.89, "r_x1": 480.59, "r_y1": 379.89, "r_x2": 480.59, "r_y2": 371.09, "r_x3": 252.11, "r_y3": 371.09, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 391.85, "r_x1": 284.84, "r_y1": 391.85, "r_x2": 284.84, "r_y2": 383.05, "r_x3": 151.7, "r_y3": 383.05, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Up-looking cell rule : The upper neighbour of a \"U\" cell must be either another \"U\" cell or a \"C\" cell." }, { "label": "section_header", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 138.97, "t": 395.0, "r": 226.07, "b": 403.8, "coord_origin": "TOPLEFT" }, "confidence": 0.651, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 403.8, "r_x1": 146.72, "r_y1": 403.8, "r_x2": 146.72, "r_y2": 395.01, "r_x3": 138.97, "r_y3": 395.01, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 403.8, "r_x1": 223.3, "r_y1": 403.8, "r_x2": 223.3, "r_y2": 395.0, "r_x3": 151.7, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.31, "r_y0": 403.8, "r_x1": 226.07, "r_y1": 403.8, "r_x2": 226.07, "r_y2": 395.01, "r_x3": 223.31, "r_y3": 395.01, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Cross cell rule :" }, { "label": "list_item", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 151.7, "t": 406.97, "r": 480.59, "b": 439.67, "coord_origin": "TOPLEFT" }, "confidence": 0.725, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 415.76, "r_x1": 480.59, "r_y1": 415.76, "r_x2": 480.59, "r_y2": 406.97, "r_x3": 151.7, "r_y3": 406.97, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 427.72, "r_x1": 480.59, "r_y1": 427.72, "r_x2": 480.59, "r_y2": 418.92, "r_x3": 151.7, "r_y3": 418.92, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 439.67, "r_x1": 214.4, "r_y1": 439.67, "r_x2": 214.4, "r_y2": 430.88, "r_x3": 151.7, "r_y3": 430.88, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\" cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell or an \"L\" cell." }, { "label": "list_item", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 138.97, "t": 442.83, "r": 474.59, "b": 451.63, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 451.63, "r_x1": 146.72, "r_y1": 451.63, "r_x2": 146.72, "r_y2": 442.84, "r_x3": 138.97, "r_y3": 442.84, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 451.63, "r_x1": 221.32, "r_y1": 451.63, "r_x2": 221.32, "r_y2": 442.83, "r_x3": 151.7, "r_y3": 442.83, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.33, "r_y0": 451.63, "r_x1": 474.59, "r_y1": 451.63, "r_x2": 474.59, "r_y2": 442.84, "r_x3": 221.33, "r_y3": 442.84, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. First row rule : Only \"L\" cells and \"C\" cells are allowed in the first row." }, { "label": "list_item", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 138.97, "t": 454.78, "r": 480.59, "b": 475.55, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 463.59, "r_x1": 146.72, "r_y1": 463.59, "r_x2": 146.72, "r_y2": 454.79, "r_x3": 138.97, "r_y3": 454.79, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 463.59, "r_x1": 240.72, "r_y1": 463.59, "r_x2": 240.72, "r_y2": 454.78, "r_x3": 151.7, "r_y3": 454.78, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.72, "r_y0": 463.59, "r_x1": 480.59, "r_y1": 463.59, "r_x2": 480.59, "r_y2": 454.79, "r_x3": 240.72, "r_y3": 454.79, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 475.55, "r_x1": 186.01, "r_y1": 475.55, "r_x2": 186.01, "r_y2": 466.75, "r_x3": 151.7, "r_y3": 466.75, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. First column rule : Only \"U\" cells and \"C\" cells are allowed in the first column." }, { "label": "list_item", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 138.97, "t": 478.7, "r": 480.59, "b": 499.46, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 487.5, "r_x1": 146.72, "r_y1": 487.5, "r_x2": 146.72, "r_y2": 478.71, "r_x3": 138.97, "r_y3": 478.71, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 487.5, "r_x1": 235.16, "r_y1": 487.5, "r_x2": 235.16, "r_y2": 478.7, "r_x3": 151.7, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.16, "r_y0": 487.5, "r_x1": 480.59, "r_y1": 487.5, "r_x2": 480.59, "r_y2": 478.71, "r_x3": 235.16, "r_y3": 478.71, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 499.46, "r_x1": 448.04, "r_y1": 499.46, "r_x2": 448.04, "r_y2": 490.66, "r_x3": 151.7, "r_y3": 490.66, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Rectangular rule : The table representation is always rectangular - all rows must have an equal number of tokens, terminated with \"NL\" token." }, { "label": "text", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 512.59, "r": 480.6, "b": 640.94, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 521.39, "r_x1": 480.6, "r_y1": 521.39, "r_x2": 480.6, "r_y2": 512.59, "r_x3": 149.71, "r_y3": 512.59, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.34, "r_x1": 480.59, "r_y1": 533.34, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.5, "r_x3": 134.76, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.41, "r_x3": 134.76, "r_y3": 560.41, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.32, "r_x3": 134.76, "r_y3": 584.32, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.23, "r_x3": 134.76, "r_y3": 608.23, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.76, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 311.2, "r_y1": 640.94, "r_x2": 311.2, "r_y2": 632.14, "r_x3": 134.76, "r_y3": 632.14, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The application of these rules gives OTSL a set of unique properties. First of all, the OTSL enforces a strictly rectangular structure representation, where every new-line token starts a new row. As a consequence, all rows and all columns have exactly the same number of tokens, irrespective of cell spans. Secondly, the OTSL representation is unambiguous: Every table structure is represented in one way. In this representation every table cell corresponds to a \"C\"-cell token, which in case of spans is always located in the top-left corner of the table cell definition. Third, OTSL syntax rules are only backward-looking. As a consequence, every predicted token can be validated straight during sequence generation by looking at the previously predicted sequence. As such, OTSL can guarantee that every predicted sequence is syntactically valid." }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 644.1, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 149.71, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "These characteristics can be easily learned by sequence generator networks, as we demonstrate further below. We find strong indications that this pattern" } ], "body": [ { "label": "caption", "id": 6, "page_no": 6, "cluster": { "id": 6, "label": "caption", "bbox": { "l": 134.76, "t": 125.8, "r": 480.59, "b": 155.85, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 133.73, "r_x1": 162.64, "r_y1": 133.73, "r_x2": 162.64, "r_y2": 125.8, "r_x3": 134.76, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 3.", "orig": "Fig. 3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 166.28, "r_y0": 133.93, "r_x1": 480.59, "r_y1": 133.93, "r_x2": 480.59, "r_y2": 125.86, "r_x3": 166.28, "r_y3": 125.86, "coord_origin": "TOPLEFT" }, "text": "OTSL description of table structure: A - table example; B - graphical repre-", "orig": "OTSL description of table structure: A - table example; B - graphical repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 144.89, "r_x1": 480.59, "r_y1": 144.89, "r_x2": 480.59, "r_y2": 136.82, "r_x3": 134.76, "r_y3": 136.82, "coord_origin": "TOPLEFT" }, "text": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "orig": "sentation of table structure; C - mapping structure on a grid; D - OTSL structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.85, "r_x1": 306.12, "r_y1": 155.85, "r_x2": 306.12, "r_y2": 147.78, "r_x3": 134.76, "r_y3": 147.78, "coord_origin": "TOPLEFT" }, "text": "encoding; E - explanation on cell encoding", "orig": "encoding; E - explanation on cell encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 3. OTSL description of table structure: A - table example; B - graphical representation of table structure; C - mapping structure on a grid; D - OTSL structure encoding; E - explanation on cell encoding" }, { "label": "picture", "id": 12, "page_no": 6, "cluster": { "id": 12, "label": "picture", "bbox": { "l": 164.65, "t": 163.8, "r": 449.55, "b": 280.34, "coord_origin": "TOPLEFT" }, "confidence": 0.787, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49, "r_y0": 177.92, "r_x1": 381.67, "r_y1": 177.92, "r_x2": 381.67, "r_y2": 168.59, "r_x3": 374.49, "r_y3": 168.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74, "r_y0": 177.82, "r_x1": 405.92, "r_y1": 177.82, "r_x2": 405.92, "r_y2": 168.5, "r_x3": 398.74, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.77, "r_y0": 202.25, "r_x1": 380.94, "r_y1": 202.25, "r_x2": 380.94, "r_y2": 192.93, "r_x3": 373.77, "r_y3": 192.93, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66, "r_y0": 202.39, "r_x1": 393.84, "r_y1": 202.39, "r_x2": 393.84, "r_y2": 193.07, "r_x3": 386.66, "r_y3": 193.07, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.69, "r_y0": 214.46, "r_x1": 393.86, "r_y1": 214.46, "r_x2": 393.86, "r_y2": 205.14, "r_x3": 386.69, "r_y3": 205.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.66, "r_y0": 190.05, "r_x1": 405.83, "r_y1": 190.05, "r_x2": 405.83, "r_y2": 180.73, "r_x3": 398.66, "r_y3": 180.73, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.78, "r_y0": 190.06, "r_x1": 417.95, "r_y1": 190.06, "r_x2": 417.95, "r_y2": 180.74, "r_x3": 410.78, "r_y3": 180.74, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.91, "r_y0": 189.97, "r_x1": 430.08, "r_y1": 189.97, "r_x2": 430.08, "r_y2": 180.65, "r_x3": 422.91, "r_y3": 180.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 202.31, "r_x1": 405.96, "r_y1": 202.31, "r_x2": 405.96, "r_y2": 192.99, "r_x3": 398.78, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.32, "r_x1": 418.08, "r_y1": 202.32, "r_x2": 418.08, "r_y2": 192.99, "r_x3": 410.9, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 202.23, "r_x1": 430.2, "r_y1": 202.23, "r_x2": 430.2, "r_y2": 192.91, "r_x3": 423.03, "r_y3": 192.91, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 214.64, "r_x1": 405.96, "r_y1": 214.64, "r_x2": 405.96, "r_y2": 205.32, "r_x3": 398.78, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.64, "r_x1": 418.08, "r_y1": 214.64, "r_x2": 418.08, "r_y2": 205.32, "r_x3": 410.9, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 214.56, "r_x1": 430.21, "r_y1": 214.56, "r_x2": 430.21, "r_y2": 205.24, "r_x3": 423.03, "r_y3": 205.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.51, "r_y0": 226.36, "r_x1": 393.68, "r_y1": 226.36, "r_x2": 393.68, "r_y2": 217.04, "r_x3": 386.51, "r_y3": 217.04, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.54, "r_x1": 405.78, "r_y1": 226.54, "r_x2": 405.78, "r_y2": 217.22, "r_x3": 398.6, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72, "r_y0": 226.54, "r_x1": 417.9, "r_y1": 226.54, "r_x2": 417.9, "r_y2": 217.22, "r_x3": 410.72, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.85, "r_y0": 226.46, "r_x1": 430.02, "r_y1": 226.46, "r_x2": 430.02, "r_y2": 217.14, "r_x3": 422.85, "r_y3": 217.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16, "r_y0": 177.01, "r_x1": 447.86, "r_y1": 177.01, "r_x2": 447.86, "r_y2": 167.69, "r_x3": 435.16, "r_y3": 167.69, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44, "r_y0": 189.52, "r_x1": 448.15, "r_y1": 189.52, "r_x2": 448.15, "r_y2": 180.2, "r_x3": 435.44, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.47, "r_y0": 201.82, "r_x1": 448.17, "r_y1": 201.82, "r_x2": 448.17, "r_y2": 192.49, "r_x3": 435.47, "r_y3": 192.49, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38, "r_y0": 214.15, "r_x1": 448.08, "r_y1": 214.15, "r_x2": 448.08, "r_y2": 204.83, "r_x3": 435.38, "r_y3": 204.83, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.56, "r_x1": 448.3, "r_y1": 226.56, "r_x2": 448.3, "r_y2": 217.23, "r_x3": 435.6, "r_y3": 217.23, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.15, "r_y0": 214.56, "r_x1": 381.32, "r_y1": 214.56, "r_x2": 381.32, "r_y2": 205.23, "r_x3": 374.15, "r_y3": 205.23, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.04, "r_y0": 226.47, "r_x1": 381.22, "r_y1": 226.47, "r_x2": 381.22, "r_y2": 217.15, "r_x3": 374.04, "r_y3": 217.15, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34, "r_y0": 190.26, "r_x1": 381.52, "r_y1": 190.26, "r_x2": 381.52, "r_y2": 180.93, "r_x3": 374.34, "r_y3": 180.93, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76, "r_y0": 177.9, "r_x1": 393.29, "r_y1": 177.9, "r_x2": 393.29, "r_y2": 168.58, "r_x3": 387.76, "r_y3": 168.58, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86, "r_y0": 177.38, "r_x1": 417.39, "r_y1": 177.38, "r_x2": 417.39, "r_y2": 168.06, "r_x3": 411.86, "r_y3": 168.06, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.34, "r_y0": 177.26, "r_x1": 428.86, "r_y1": 177.26, "r_x2": 428.86, "r_y2": 167.93, "r_x3": 423.34, "r_y3": 167.93, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.14, "r_y0": 190.11, "r_x1": 393.76, "r_y1": 190.11, "r_x2": 393.76, "r_y2": 180.79, "r_x3": 387.14, "r_y3": 180.79, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.26, "r_y0": 253.83, "r_x1": 289.43, "r_y1": 253.83, "r_x2": 289.43, "r_y2": 244.51, "r_x3": 282.26, "r_y3": 244.51, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11, "r_y0": 266.17, "r_x1": 289.29, "r_y1": 266.17, "r_x2": 289.29, "r_y2": 256.85, "r_x3": 282.11, "r_y3": 256.85, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.41, "r_y0": 278.45, "r_x1": 289.58, "r_y1": 278.45, "r_x2": 289.58, "r_y2": 269.13, "r_x3": 282.41, "r_y3": 269.13, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.53, "r_y0": 253.82, "r_x1": 301.05, "r_y1": 253.82, "r_x2": 301.05, "r_y2": 244.49, "r_x3": 295.53, "r_y3": 244.49, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.47, "r_y0": 253.9, "r_x1": 312.99, "r_y1": 253.9, "r_x2": 312.99, "r_y2": 244.57, "r_x3": 307.47, "r_y3": 244.57, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 253.76, "r_x1": 324.29, "r_y1": 253.76, "r_x2": 324.29, "r_y2": 244.44, "r_x3": 318.77, "r_y3": 244.44, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.02, "r_x1": 301.04, "r_y1": 266.02, "r_x2": 301.04, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.18, "r_y0": 266.02, "r_x1": 325.59, "r_y1": 266.02, "r_x2": 325.59, "r_y2": 256.7, "r_x3": 307.18, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.79, "r_y0": 278.58, "r_x1": 300.93, "r_y1": 278.58, "r_x2": 300.93, "r_y2": 269.25, "r_x3": 294.79, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06, "r_y0": 278.58, "r_x1": 325.48, "r_y1": 278.58, "r_x2": 325.48, "r_y2": 269.25, "r_x3": 307.06, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.94, "r_y0": 278.07, "r_x1": 203.11, "r_y1": 278.07, "r_x2": 203.11, "r_y2": 268.75, "r_x3": 195.94, "r_y3": 268.75, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.21, "r_y0": 278.05, "r_x1": 214.73, "r_y1": 278.05, "r_x2": 214.73, "r_y2": 268.73, "r_x3": 209.21, "r_y3": 268.73, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.15, "r_y0": 278.13, "r_x1": 226.67, "r_y1": 278.13, "r_x2": 226.67, "r_y2": 268.81, "r_x3": 221.15, "r_y3": 268.81, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.45, "r_y0": 278.0, "r_x1": 237.97, "r_y1": 278.0, "r_x2": 237.97, "r_y2": 268.68, "r_x3": 232.45, "r_y3": 268.68, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.22, "r_y0": 253.86, "r_x1": 203.39, "r_y1": 253.86, "r_x2": 203.39, "r_y2": 244.54, "r_x3": 196.22, "r_y3": 244.54, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32, "r_y0": 253.42, "r_x1": 257.5, "r_y1": 253.42, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.32, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17, "r_y0": 265.76, "r_x1": 257.35, "r_y1": 265.76, "r_x2": 257.35, "r_y2": 256.44, "r_x3": 250.17, "r_y3": 256.44, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47, "r_y0": 278.04, "r_x1": 257.65, "r_y1": 278.04, "r_x2": 257.65, "r_y2": 268.72, "r_x3": 250.47, "r_y3": 268.72, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 249.21, "r_x1": 337.22, "r_y1": 249.21, "r_x2": 337.22, "r_y2": 242.99, "r_x3": 334.51, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.94, "r_y0": 249.21, "r_x1": 391.49, "r_y1": 249.21, "r_x2": 391.49, "r_y2": 242.99, "r_x3": 339.94, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 259.15, "r_x1": 337.33, "r_y1": 259.15, "r_x2": 337.33, "r_y2": 252.93, "r_x3": 334.51, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15, "r_y0": 259.15, "r_x1": 421.99, "r_y1": 259.15, "r_x2": 421.99, "r_y2": 252.93, "r_x3": 340.15, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 269.08, "r_x1": 337.3, "r_y1": 269.08, "r_x2": 337.3, "r_y2": 262.87, "r_x3": 334.51, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 269.08, "r_x1": 415.34, "r_y1": 269.08, "r_x2": 415.34, "r_y2": 262.87, "r_x3": 340.09, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 279.02, "r_x1": 337.3, "r_y1": 279.02, "r_x2": 337.3, "r_y2": 272.81, "r_x3": 334.51, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 279.02, "r_x1": 426.6, "r_y1": 279.02, "r_x2": 426.6, "r_y2": 272.81, "r_x3": 340.09, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67, "r_y0": 250.26, "r_x1": 189.36, "r_y1": 250.26, "r_x2": 189.36, "r_y2": 244.04, "r_x3": 185.67, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.97, "r_y0": 274.56, "r_x1": 189.65, "r_y1": 274.56, "r_x2": 189.65, "r_y2": 268.35, "r_x3": 185.97, "r_y3": 268.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34, "r_y0": 249.84, "r_x1": 243.03, "r_y1": 249.84, "r_x2": 243.03, "r_y2": 243.63, "r_x3": 239.34, "r_y3": 243.63, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.33, "r_y0": 249.71, "r_x1": 275.01, "r_y1": 249.71, "r_x2": 275.01, "r_y2": 243.49, "r_x3": 271.33, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.82, "r_y0": 172.73, "r_x1": 233.5, "r_y1": 172.73, "r_x2": 233.5, "r_y2": 166.51, "r_x3": 229.82, "r_y3": 166.51, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24, "r_y0": 196.18, "r_x1": 260.93, "r_y1": 196.18, "r_x2": 260.93, "r_y2": 189.96, "r_x3": 257.24, "r_y3": 189.96, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.88, "r_y0": 184.19, "r_x1": 190.56, "r_y1": 184.19, "r_x2": 190.56, "r_y2": 177.98, "r_x3": 186.88, "r_y3": 177.98, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.49, "r_y0": 175.23, "r_x1": 200.17, "r_y1": 175.23, "r_x2": 200.17, "r_y2": 169.02, "r_x3": 196.49, "r_y3": 169.02, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 175.65, "r_x1": 175.73, "r_y1": 175.65, "r_x2": 175.73, "r_y2": 167.88, "r_x3": 169.75, "r_y3": 167.88, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 214.61, "r_x1": 175.73, "r_y1": 214.61, "r_x2": 175.73, "r_y2": 206.84, "r_x3": 169.75, "r_y3": 206.84, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29, "r_y0": 176.05, "r_x1": 280.27, "r_y1": 176.05, "r_x2": 280.27, "r_y2": 168.28, "r_x3": 274.29, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56, "r_y0": 176.05, "r_x1": 365.54, "r_y1": 176.05, "r_x2": 365.54, "r_y2": 168.28, "r_x3": 359.56, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 250.98, "r_x1": 175.27, "r_y1": 250.98, "r_x2": 175.27, "r_y2": 243.21, "r_x3": 169.75, "r_y3": 243.21, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 38, "label": "text", "bbox": { "l": 374.49, "t": 168.59, "r": 381.67, "b": 177.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.49, "r_y0": 177.92, "r_x1": 381.67, "r_y1": 177.92, "r_x2": 381.67, "r_y2": 168.59, "r_x3": 374.49, "r_y3": 168.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 398.74, "t": 168.5, "r": 405.92, "b": 177.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.74, "r_y0": 177.82, "r_x1": 405.92, "r_y1": 177.82, "r_x2": 405.92, "r_y2": 168.5, "r_x3": 398.74, "r_y3": 168.5, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 373.77, "t": 192.93, "r": 380.94, "b": 202.25, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.77, "r_y0": 202.25, "r_x1": 380.94, "r_y1": 202.25, "r_x2": 380.94, "r_y2": 192.93, "r_x3": 373.77, "r_y3": 192.93, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 386.66, "t": 193.07, "r": 393.84, "b": 202.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.66, "r_y0": 202.39, "r_x1": 393.84, "r_y1": 202.39, "r_x2": 393.84, "r_y2": 193.07, "r_x3": 386.66, "r_y3": 193.07, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 386.69, "t": 205.14, "r": 393.86, "b": 214.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.69, "r_y0": 214.46, "r_x1": 393.86, "r_y1": 214.46, "r_x2": 393.86, "r_y2": 205.14, "r_x3": 386.69, "r_y3": 205.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 398.66, "t": 180.73, "r": 405.83, "b": 190.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.66, "r_y0": 190.05, "r_x1": 405.83, "r_y1": 190.05, "r_x2": 405.83, "r_y2": 180.73, "r_x3": 398.66, "r_y3": 180.73, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 410.78, "t": 180.74, "r": 417.95, "b": 190.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.78, "r_y0": 190.06, "r_x1": 417.95, "r_y1": 190.06, "r_x2": 417.95, "r_y2": 180.74, "r_x3": 410.78, "r_y3": 180.74, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 422.91, "t": 180.65, "r": 430.08, "b": 189.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.91, "r_y0": 189.97, "r_x1": 430.08, "r_y1": 189.97, "r_x2": 430.08, "r_y2": 180.65, "r_x3": 422.91, "r_y3": 180.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 398.78, "t": 192.99, "r": 405.96, "b": 202.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 202.31, "r_x1": 405.96, "r_y1": 202.31, "r_x2": 405.96, "r_y2": 192.99, "r_x3": 398.78, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 410.9, "t": 192.99, "r": 418.08, "b": 202.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 202.32, "r_x1": 418.08, "r_y1": 202.32, "r_x2": 418.08, "r_y2": 192.99, "r_x3": 410.9, "r_y3": 192.99, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 423.03, "t": 192.91, "r": 430.2, "b": 202.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 202.23, "r_x1": 430.2, "r_y1": 202.23, "r_x2": 430.2, "r_y2": 192.91, "r_x3": 423.03, "r_y3": 192.91, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 398.78, "t": 205.32, "r": 405.96, "b": 214.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.78, "r_y0": 214.64, "r_x1": 405.96, "r_y1": 214.64, "r_x2": 405.96, "r_y2": 205.32, "r_x3": 398.78, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 410.9, "t": 205.32, "r": 418.08, "b": 214.64, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.9, "r_y0": 214.64, "r_x1": 418.08, "r_y1": 214.64, "r_x2": 418.08, "r_y2": 205.32, "r_x3": 410.9, "r_y3": 205.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 423.03, "t": 205.24, "r": 430.21, "b": 214.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.03, "r_y0": 214.56, "r_x1": 430.21, "r_y1": 214.56, "r_x2": 430.21, "r_y2": 205.24, "r_x3": 423.03, "r_y3": 205.24, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 386.51, "t": 217.04, "r": 393.68, "b": 226.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.51, "r_y0": 226.36, "r_x1": 393.68, "r_y1": 226.36, "r_x2": 393.68, "r_y2": 217.04, "r_x3": 386.51, "r_y3": 217.04, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 398.6, "t": 217.22, "r": 405.78, "b": 226.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 398.6, "r_y0": 226.54, "r_x1": 405.78, "r_y1": 226.54, "r_x2": 405.78, "r_y2": 217.22, "r_x3": 398.6, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 410.72, "t": 217.22, "r": 417.9, "b": 226.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.72, "r_y0": 226.54, "r_x1": 417.9, "r_y1": 226.54, "r_x2": 417.9, "r_y2": 217.22, "r_x3": 410.72, "r_y3": 217.22, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 422.85, "t": 217.14, "r": 430.02, "b": 226.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 422.85, "r_y0": 226.46, "r_x1": 430.02, "r_y1": 226.46, "r_x2": 430.02, "r_y2": 217.14, "r_x3": 422.85, "r_y3": 217.14, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 435.16, "t": 167.69, "r": 447.86, "b": 177.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.16, "r_y0": 177.01, "r_x1": 447.86, "r_y1": 177.01, "r_x2": 447.86, "r_y2": 167.69, "r_x3": 435.16, "r_y3": 167.69, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 435.44, "t": 180.2, "r": 448.15, "b": 189.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.44, "r_y0": 189.52, "r_x1": 448.15, "r_y1": 189.52, "r_x2": 448.15, "r_y2": 180.2, "r_x3": 435.44, "r_y3": 180.2, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 435.47, "t": 192.49, "r": 448.17, "b": 201.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.47, "r_y0": 201.82, "r_x1": 448.17, "r_y1": 201.82, "r_x2": 448.17, "r_y2": 192.49, "r_x3": 435.47, "r_y3": 192.49, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 435.38, "t": 204.83, "r": 448.08, "b": 214.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.38, "r_y0": 214.15, "r_x1": 448.08, "r_y1": 214.15, "r_x2": 448.08, "r_y2": 204.83, "r_x3": 435.38, "r_y3": 204.83, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 435.6, "t": 217.23, "r": 448.3, "b": 226.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.6, "r_y0": 226.56, "r_x1": 448.3, "r_y1": 226.56, "r_x2": 448.3, "r_y2": 217.23, "r_x3": 435.6, "r_y3": 217.23, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 374.15, "t": 205.23, "r": 381.32, "b": 214.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.15, "r_y0": 214.56, "r_x1": 381.32, "r_y1": 214.56, "r_x2": 381.32, "r_y2": 205.23, "r_x3": 374.15, "r_y3": 205.23, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 374.04, "t": 217.15, "r": 381.22, "b": 226.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.04, "r_y0": 226.47, "r_x1": 381.22, "r_y1": 226.47, "r_x2": 381.22, "r_y2": 217.15, "r_x3": 374.04, "r_y3": 217.15, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 374.34, "t": 180.93, "r": 381.52, "b": 190.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 374.34, "r_y0": 190.26, "r_x1": 381.52, "r_y1": 190.26, "r_x2": 381.52, "r_y2": 180.93, "r_x3": 374.34, "r_y3": 180.93, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 387.76, "t": 168.58, "r": 393.29, "b": 177.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.76, "r_y0": 177.9, "r_x1": 393.29, "r_y1": 177.9, "r_x2": 393.29, "r_y2": 168.58, "r_x3": 387.76, "r_y3": 168.58, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 411.86, "t": 168.06, "r": 417.39, "b": 177.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 411.86, "r_y0": 177.38, "r_x1": 417.39, "r_y1": 177.38, "r_x2": 417.39, "r_y2": 168.06, "r_x3": 411.86, "r_y3": 168.06, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 423.34, "t": 167.93, "r": 428.86, "b": 177.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.34, "r_y0": 177.26, "r_x1": 428.86, "r_y1": 177.26, "r_x2": 428.86, "r_y2": 167.93, "r_x3": 423.34, "r_y3": 167.93, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 387.14, "t": 180.79, "r": 393.76, "b": 190.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 387.14, "r_y0": 190.11, "r_x1": 393.76, "r_y1": 190.11, "r_x2": 393.76, "r_y2": 180.79, "r_x3": 387.14, "r_y3": 180.79, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 282.26, "t": 244.51, "r": 289.43, "b": 253.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.26, "r_y0": 253.83, "r_x1": 289.43, "r_y1": 253.83, "r_x2": 289.43, "r_y2": 244.51, "r_x3": 282.26, "r_y3": 244.51, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 282.11, "t": 256.85, "r": 289.29, "b": 266.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.11, "r_y0": 266.17, "r_x1": 289.29, "r_y1": 266.17, "r_x2": 289.29, "r_y2": 256.85, "r_x3": 282.11, "r_y3": 256.85, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 282.41, "t": 269.13, "r": 289.58, "b": 278.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 282.41, "r_y0": 278.45, "r_x1": 289.58, "r_y1": 278.45, "r_x2": 289.58, "r_y2": 269.13, "r_x3": 282.41, "r_y3": 269.13, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 295.53, "t": 244.49, "r": 301.05, "b": 253.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 295.53, "r_y0": 253.82, "r_x1": 301.05, "r_y1": 253.82, "r_x2": 301.05, "r_y2": 244.49, "r_x3": 295.53, "r_y3": 244.49, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 307.47, "t": 244.57, "r": 312.99, "b": 253.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.47, "r_y0": 253.9, "r_x1": 312.99, "r_y1": 253.9, "r_x2": 312.99, "r_y2": 244.57, "r_x3": 307.47, "r_y3": 244.57, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 318.77, "t": 244.44, "r": 324.29, "b": 253.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 318.77, "r_y0": 253.76, "r_x1": 324.29, "r_y1": 253.76, "r_x2": 324.29, "r_y2": 244.44, "r_x3": 318.77, "r_y3": 244.44, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 294.9, "t": 256.7, "r": 301.04, "b": 266.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.9, "r_y0": 266.02, "r_x1": 301.04, "r_y1": 266.02, "r_x2": 301.04, "r_y2": 256.7, "r_x3": 294.9, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 307.18, "t": 256.7, "r": 325.59, "b": 266.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.18, "r_y0": 266.02, "r_x1": 325.59, "r_y1": 266.02, "r_x2": 325.59, "r_y2": 256.7, "r_x3": 307.18, "r_y3": 256.7, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 294.79, "t": 269.25, "r": 300.93, "b": 278.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 294.79, "r_y0": 278.58, "r_x1": 300.93, "r_y1": 278.58, "r_x2": 300.93, "r_y2": 269.25, "r_x3": 294.79, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X", "orig": "X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 307.06, "t": 269.25, "r": 325.48, "b": 278.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 307.06, "r_y0": 278.58, "r_x1": 325.48, "r_y1": 278.58, "r_x2": 325.48, "r_y2": 269.25, "r_x3": 307.06, "r_y3": 269.25, "coord_origin": "TOPLEFT" }, "text": "X X", "orig": "X X", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 195.94, "t": 268.75, "r": 203.11, "b": 278.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.94, "r_y0": 278.07, "r_x1": 203.11, "r_y1": 278.07, "r_x2": 203.11, "r_y2": 268.75, "r_x3": 195.94, "r_y3": 268.75, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 209.21, "t": 268.73, "r": 214.73, "b": 278.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.21, "r_y0": 278.05, "r_x1": 214.73, "r_y1": 278.05, "r_x2": 214.73, "r_y2": 268.73, "r_x3": 209.21, "r_y3": 268.73, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 221.15, "t": 268.81, "r": 226.67, "b": 278.13, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.15, "r_y0": 278.13, "r_x1": 226.67, "r_y1": 278.13, "r_x2": 226.67, "r_y2": 268.81, "r_x3": 221.15, "r_y3": 268.81, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 232.45, "t": 268.68, "r": 237.97, "b": 278.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.45, "r_y0": 278.0, "r_x1": 237.97, "r_y1": 278.0, "r_x2": 237.97, "r_y2": 268.68, "r_x3": 232.45, "r_y3": 268.68, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 196.22, "t": 244.54, "r": 203.39, "b": 253.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.22, "r_y0": 253.86, "r_x1": 203.39, "r_y1": 253.86, "r_x2": 203.39, "r_y2": 244.54, "r_x3": 196.22, "r_y3": 244.54, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 250.32, "t": 244.1, "r": 257.5, "b": 253.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.32, "r_y0": 253.42, "r_x1": 257.5, "r_y1": 253.42, "r_x2": 257.5, "r_y2": 244.1, "r_x3": 250.32, "r_y3": 244.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 250.17, "t": 256.44, "r": 257.35, "b": 265.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.17, "r_y0": 265.76, "r_x1": 257.35, "r_y1": 265.76, "r_x2": 257.35, "r_y2": 256.44, "r_x3": 250.17, "r_y3": 256.44, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 250.47, "t": 268.72, "r": 257.65, "b": 278.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 250.47, "r_y0": 278.04, "r_x1": 257.65, "r_y1": 278.04, "r_x2": 257.65, "r_y2": 268.72, "r_x3": 250.47, "r_y3": 268.72, "coord_origin": "TOPLEFT" }, "text": "U", "orig": "U", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 334.51, "t": 242.99, "r": 337.22, "b": 249.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 249.21, "r_x1": 337.22, "r_y1": 249.21, "r_x2": 337.22, "r_y2": 242.99, "r_x3": 334.51, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 339.94, "t": 242.99, "r": 391.49, "b": 249.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.94, "r_y0": 249.21, "r_x1": 391.49, "r_y1": 249.21, "r_x2": 391.49, "r_y2": 242.99, "r_x3": 339.94, "r_y3": 242.99, "coord_origin": "TOPLEFT" }, "text": "- simple cells: \"C\"", "orig": "- simple cells: \"C\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 334.51, "t": 252.93, "r": 337.33, "b": 259.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 259.15, "r_x1": 337.33, "r_y1": 259.15, "r_x2": 337.33, "r_y2": 252.93, "r_x3": 334.51, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 340.15, "t": 252.93, "r": 421.99, "b": 259.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.15, "r_y0": 259.15, "r_x1": 421.99, "r_y1": 259.15, "r_x2": 421.99, "r_y2": 252.93, "r_x3": 340.15, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "- horizontal merges: \"C\", \"L\"", "orig": "- horizontal merges: \"C\", \"L\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 334.51, "t": 262.87, "r": 337.3, "b": 269.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 269.08, "r_x1": 337.3, "r_y1": 269.08, "r_x2": 337.3, "r_y2": 262.87, "r_x3": 334.51, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 340.09, "t": 262.87, "r": 415.34, "b": 269.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 269.08, "r_x1": 415.34, "r_y1": 269.08, "r_x2": 415.34, "r_y2": 262.87, "r_x3": 340.09, "r_y3": 262.87, "coord_origin": "TOPLEFT" }, "text": "- vertical merges: \"C\", \"U\"", "orig": "- vertical merges: \"C\", \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "list_item", "bbox": { "l": 334.51, "t": 272.81, "r": 426.6, "b": 279.02, "coord_origin": "TOPLEFT" }, "confidence": 0.525, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.51, "r_y0": 279.02, "r_x1": 337.3, "r_y1": 279.02, "r_x2": 337.3, "r_y2": 272.81, "r_x3": 334.51, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.09, "r_y0": 279.02, "r_x1": 426.6, "r_y1": 279.02, "r_x2": 426.6, "r_y2": 272.81, "r_x3": 340.09, "r_y3": 272.81, "coord_origin": "TOPLEFT" }, "text": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "orig": "- 2d merges: \"C\", \"L\", \"U\", \"X\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 185.67, "t": 244.04, "r": 189.36, "b": 250.26, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.67, "r_y0": 250.26, "r_x1": 189.36, "r_y1": 250.26, "r_x2": 189.36, "r_y2": 244.04, "r_x3": 185.67, "r_y3": 244.04, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 185.97, "t": 268.35, "r": 189.65, "b": 274.56, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 185.97, "r_y0": 274.56, "r_x1": 189.65, "r_y1": 274.56, "r_x2": 189.65, "r_y2": 268.35, "r_x3": 185.97, "r_y3": 268.35, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 239.34, "t": 243.63, "r": 243.03, "b": 249.84, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.34, "r_y0": 249.84, "r_x1": 243.03, "r_y1": 249.84, "r_x2": 243.03, "r_y2": 243.63, "r_x3": 239.34, "r_y3": 243.63, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 271.33, "t": 243.49, "r": 275.01, "b": 249.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 271.33, "r_y0": 249.71, "r_x1": 275.01, "r_y1": 249.71, "r_x2": 275.01, "r_y2": 243.49, "r_x3": 271.33, "r_y3": 243.49, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 229.82, "t": 166.51, "r": 233.5, "b": 172.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.82, "r_y0": 172.73, "r_x1": 233.5, "r_y1": 172.73, "r_x2": 233.5, "r_y2": 166.51, "r_x3": 229.82, "r_y3": 166.51, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 257.24, "t": 189.96, "r": 260.93, "b": 196.18, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.24, "r_y0": 196.18, "r_x1": 260.93, "r_y1": 196.18, "r_x2": 260.93, "r_y2": 189.96, "r_x3": 257.24, "r_y3": 189.96, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 186.88, "t": 177.98, "r": 190.56, "b": 184.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 186.88, "r_y0": 184.19, "r_x1": 190.56, "r_y1": 184.19, "r_x2": 190.56, "r_y2": 177.98, "r_x3": 186.88, "r_y3": 177.98, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 196.49, "t": 169.02, "r": 200.17, "b": 175.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 196.49, "r_y0": 175.23, "r_x1": 200.17, "r_y1": 175.23, "r_x2": 200.17, "r_y2": 169.02, "r_x3": 196.49, "r_y3": 169.02, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 169.75, "t": 167.88, "r": 175.73, "b": 175.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 175.65, "r_x1": 175.73, "r_y1": 175.65, "r_x2": 175.73, "r_y2": 167.88, "r_x3": 169.75, "r_y3": 167.88, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 169.75, "t": 206.84, "r": 175.73, "b": 214.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 214.61, "r_x1": 175.73, "r_y1": 214.61, "r_x2": 175.73, "r_y2": 206.84, "r_x3": 169.75, "r_y3": 206.84, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 274.29, "t": 168.28, "r": 280.27, "b": 176.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 274.29, "r_y0": 176.05, "r_x1": 280.27, "r_y1": 176.05, "r_x2": 280.27, "r_y2": 168.28, "r_x3": 274.29, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 359.56, "t": 168.28, "r": 365.54, "b": 176.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 359.56, "r_y0": 176.05, "r_x1": 365.54, "r_y1": 176.05, "r_x2": 365.54, "r_y2": 168.28, "r_x3": 359.56, "r_y3": 168.28, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 169.75, "t": 243.21, "r": 175.27, "b": 250.98, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 169.75, "r_y0": 250.98, "r_x1": 175.27, "r_y1": 250.98, "r_x2": 175.27, "r_y2": 243.21, "r_x3": 169.75, "r_y3": 243.21, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "section_header", "id": 9, "page_no": 6, "cluster": { "id": 9, "label": "section_header", "bbox": { "l": 134.76, "t": 305.3, "r": 246.65, "b": 314.1, "coord_origin": "TOPLEFT" }, "confidence": 0.923, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 314.1, "r_x1": 149.4, "r_y1": 314.1, "r_x2": 149.4, "r_y2": 305.3, "r_x3": 134.76, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "4.2", "orig": "4.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 314.1, "r_x1": 246.65, "r_y1": 314.1, "r_x2": 246.65, "r_y2": 305.3, "r_x3": 160.86, "r_y3": 305.3, "coord_origin": "TOPLEFT" }, "text": "Language Syntax", "orig": "Language Syntax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.2 Language Syntax" }, { "label": "text", "id": 10, "page_no": 6, "cluster": { "id": 10, "label": "text", "bbox": { "l": 134.76, "t": 325.25, "r": 363.8, "b": 334.04, "coord_origin": "TOPLEFT" }, "confidence": 0.917, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 334.04, "r_x1": 363.8, "r_y1": 334.04, "r_x2": 363.8, "r_y2": 325.25, "r_x3": 134.76, "r_y3": 325.25, "coord_origin": "TOPLEFT" }, "text": "The OTSL representation follows these syntax rules:", "orig": "The OTSL representation follows these syntax rules:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The OTSL representation follows these syntax rules:" }, { "label": "list_item", "id": 3, "page_no": 6, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 138.97, "t": 347.17, "r": 480.59, "b": 367.93, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 355.98, "r_x1": 146.72, "r_y1": 355.98, "r_x2": 146.72, "r_y2": 347.18, "r_x3": 138.97, "r_y3": 347.18, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 355.98, "r_x1": 257.38, "r_y1": 355.98, "r_x2": 257.38, "r_y2": 347.17, "r_x3": 151.7, "r_y3": 347.17, "coord_origin": "TOPLEFT" }, "text": "Left-looking cell rule", "orig": "Left-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 257.38, "r_y0": 355.98, "r_x1": 480.59, "r_y1": 355.98, "r_x2": 480.59, "r_y2": 347.18, "r_x3": 257.38, "r_y3": 347.18, "coord_origin": "TOPLEFT" }, "text": ": The left neighbour of an \"L\" cell must be either", "orig": ": The left neighbour of an \"L\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 367.93, "r_x1": 283.59, "r_y1": 367.93, "r_x2": 283.59, "r_y2": 359.14, "r_x3": 151.7, "r_y3": 359.14, "coord_origin": "TOPLEFT" }, "text": "another \"L\" cell or a \"C\" cell.", "orig": "another \"L\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Left-looking cell rule : The left neighbour of an \"L\" cell must be either another \"L\" cell or a \"C\" cell." }, { "label": "list_item", "id": 4, "page_no": 6, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 138.97, "t": 371.08, "r": 480.59, "b": 391.85, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 379.89, "r_x1": 146.72, "r_y1": 379.89, "r_x2": 146.72, "r_y2": 371.09, "r_x3": 138.97, "r_y3": 371.09, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 379.89, "r_x1": 252.11, "r_y1": 379.89, "r_x2": 252.11, "r_y2": 371.08, "r_x3": 151.7, "r_y3": 371.08, "coord_origin": "TOPLEFT" }, "text": "Up-looking cell rule", "orig": "Up-looking cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 252.11, "r_y0": 379.89, "r_x1": 480.59, "r_y1": 379.89, "r_x2": 480.59, "r_y2": 371.09, "r_x3": 252.11, "r_y3": 371.09, "coord_origin": "TOPLEFT" }, "text": ": The upper neighbour of a \"U\" cell must be either", "orig": ": The upper neighbour of a \"U\" cell must be either", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 391.85, "r_x1": 284.84, "r_y1": 391.85, "r_x2": 284.84, "r_y2": 383.05, "r_x3": 151.7, "r_y3": 383.05, "coord_origin": "TOPLEFT" }, "text": "another \"U\" cell or a \"C\" cell.", "orig": "another \"U\" cell or a \"C\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Up-looking cell rule : The upper neighbour of a \"U\" cell must be either another \"U\" cell or a \"C\" cell." }, { "label": "section_header", "id": 14, "page_no": 6, "cluster": { "id": 14, "label": "section_header", "bbox": { "l": 138.97, "t": 395.0, "r": 226.07, "b": 403.8, "coord_origin": "TOPLEFT" }, "confidence": 0.651, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 403.8, "r_x1": 146.72, "r_y1": 403.8, "r_x2": 146.72, "r_y2": 395.01, "r_x3": 138.97, "r_y3": 395.01, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 403.8, "r_x1": 223.3, "r_y1": 403.8, "r_x2": 223.3, "r_y2": 395.0, "r_x3": 151.7, "r_y3": 395.0, "coord_origin": "TOPLEFT" }, "text": "Cross cell rule", "orig": "Cross cell rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 223.31, "r_y0": 403.8, "r_x1": 226.07, "r_y1": 403.8, "r_x2": 226.07, "r_y2": 395.01, "r_x3": 223.31, "r_y3": 395.01, "coord_origin": "TOPLEFT" }, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Cross cell rule :" }, { "label": "list_item", "id": 13, "page_no": 6, "cluster": { "id": 13, "label": "list_item", "bbox": { "l": 151.7, "t": 406.97, "r": 480.59, "b": 439.67, "coord_origin": "TOPLEFT" }, "confidence": 0.725, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 415.76, "r_x1": 480.59, "r_y1": 415.76, "r_x2": 480.59, "r_y2": 406.97, "r_x3": 151.7, "r_y3": 406.97, "coord_origin": "TOPLEFT" }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "orig": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\"", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 427.72, "r_x1": 480.59, "r_y1": 427.72, "r_x2": 480.59, "r_y2": 418.92, "r_x3": 151.7, "r_y3": 418.92, "coord_origin": "TOPLEFT" }, "text": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "orig": "cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 439.67, "r_x1": 214.4, "r_y1": 439.67, "r_x2": 214.4, "r_y2": 430.88, "r_x3": 151.7, "r_y3": 430.88, "coord_origin": "TOPLEFT" }, "text": "or an \"L\" cell.", "orig": "or an \"L\" cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The left neighbour of an \"X\" cell must be either another \"X\" cell or a \"U\" cell, and the upper neighbour of an \"X\" cell must be either another \"X\" cell or an \"L\" cell." }, { "label": "list_item", "id": 8, "page_no": 6, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 138.97, "t": 442.83, "r": 474.59, "b": 451.63, "coord_origin": "TOPLEFT" }, "confidence": 0.926, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 451.63, "r_x1": 146.72, "r_y1": 451.63, "r_x2": 146.72, "r_y2": 442.84, "r_x3": 138.97, "r_y3": 442.84, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 451.63, "r_x1": 221.32, "r_y1": 451.63, "r_x2": 221.32, "r_y2": 442.83, "r_x3": 151.7, "r_y3": 442.83, "coord_origin": "TOPLEFT" }, "text": "First row rule", "orig": "First row rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 221.33, "r_y0": 451.63, "r_x1": 474.59, "r_y1": 451.63, "r_x2": 474.59, "r_y2": 442.84, "r_x3": 221.33, "r_y3": 442.84, "coord_origin": "TOPLEFT" }, "text": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "orig": ": Only \"L\" cells and \"C\" cells are allowed in the first row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. First row rule : Only \"L\" cells and \"C\" cells are allowed in the first row." }, { "label": "list_item", "id": 5, "page_no": 6, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 138.97, "t": 454.78, "r": 480.59, "b": 475.55, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 463.59, "r_x1": 146.72, "r_y1": 463.59, "r_x2": 146.72, "r_y2": 454.79, "r_x3": 138.97, "r_y3": 454.79, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 463.59, "r_x1": 240.72, "r_y1": 463.59, "r_x2": 240.72, "r_y2": 454.78, "r_x3": 151.7, "r_y3": 454.78, "coord_origin": "TOPLEFT" }, "text": "First column rule", "orig": "First column rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 240.72, "r_y0": 463.59, "r_x1": 480.59, "r_y1": 463.59, "r_x2": 480.59, "r_y2": 454.79, "r_x3": 240.72, "r_y3": 454.79, "coord_origin": "TOPLEFT" }, "text": ": Only \"U\" cells and \"C\" cells are allowed in the first", "orig": ": Only \"U\" cells and \"C\" cells are allowed in the first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 475.55, "r_x1": 186.01, "r_y1": 475.55, "r_x2": 186.01, "r_y2": 466.75, "r_x3": 151.7, "r_y3": 466.75, "coord_origin": "TOPLEFT" }, "text": "column.", "orig": "column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. First column rule : Only \"U\" cells and \"C\" cells are allowed in the first column." }, { "label": "list_item", "id": 1, "page_no": 6, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 138.97, "t": 478.7, "r": 480.59, "b": 499.46, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 138.97, "r_y0": 487.5, "r_x1": 146.72, "r_y1": 487.5, "r_x2": 146.72, "r_y2": 478.71, "r_x3": 138.97, "r_y3": 478.71, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 487.5, "r_x1": 235.16, "r_y1": 487.5, "r_x2": 235.16, "r_y2": 478.7, "r_x3": 151.7, "r_y3": 478.7, "coord_origin": "TOPLEFT" }, "text": "Rectangular rule", "orig": "Rectangular rule", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 235.16, "r_y0": 487.5, "r_x1": 480.59, "r_y1": 487.5, "r_x2": 480.59, "r_y2": 478.71, "r_x3": 235.16, "r_y3": 478.71, "coord_origin": "TOPLEFT" }, "text": ": The table representation is always rectangular - all rows", "orig": ": The table representation is always rectangular - all rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.7, "r_y0": 499.46, "r_x1": 448.04, "r_y1": 499.46, "r_x2": 448.04, "r_y2": 490.66, "r_x3": 151.7, "r_y3": 490.66, "coord_origin": "TOPLEFT" }, "text": "must have an equal number of tokens, terminated with \"NL\" token.", "orig": "must have an equal number of tokens, terminated with \"NL\" token.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Rectangular rule : The table representation is always rectangular - all rows must have an equal number of tokens, terminated with \"NL\" token." }, { "label": "text", "id": 0, "page_no": 6, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 512.59, "r": 480.6, "b": 640.94, "coord_origin": "TOPLEFT" }, "confidence": 0.979, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 521.39, "r_x1": 480.6, "r_y1": 521.39, "r_x2": 480.6, "r_y2": 512.59, "r_x3": 149.71, "r_y3": 512.59, "coord_origin": "TOPLEFT" }, "text": "The application of these rules gives OTSL a set of unique properties. First", "orig": "The application of these rules gives OTSL a set of unique properties. First", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.34, "r_x1": 480.59, "r_y1": 533.34, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "of all, the OTSL enforces a strictly rectangular structure representation, where", "orig": "of all, the OTSL enforces a strictly rectangular structure representation, where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.5, "r_x3": 134.76, "r_y3": 536.5, "coord_origin": "TOPLEFT" }, "text": "every new-line token starts a new row. As a consequence, all rows and all columns", "orig": "every new-line token starts a new row. As a consequence, all rows and all columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.59, "r_y1": 557.26, "r_x2": 480.59, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "orig": "have exactly the same number of tokens, irrespective of cell spans. Secondly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.41, "r_x3": 134.76, "r_y3": 560.41, "coord_origin": "TOPLEFT" }, "text": "OTSL representation is unambiguous: Every table structure is represented in one", "orig": "OTSL representation is unambiguous: Every table structure is represented in one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "orig": "way. In this representation every table cell corresponds to a \"C\"-cell token, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.59, "r_y1": 593.12, "r_x2": 480.59, "r_y2": 584.32, "r_x3": 134.76, "r_y3": 584.32, "coord_origin": "TOPLEFT" }, "text": "in case of spans is always located in the top-left corner of the table cell definition.", "orig": "in case of spans is always located in the top-left corner of the table cell definition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "orig": "Third, OTSL syntax rules are only backward-looking. As a consequence, every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 480.59, "r_y1": 617.03, "r_x2": 480.59, "r_y2": 608.23, "r_x3": 134.76, "r_y3": 608.23, "coord_origin": "TOPLEFT" }, "text": "predicted token can be validated straight during sequence generation by looking", "orig": "predicted token can be validated straight during sequence generation by looking", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 134.76, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "at the previously predicted sequence. As such, OTSL can guarantee that every", "orig": "at the previously predicted sequence. As such, OTSL can guarantee that every", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 311.2, "r_y1": 640.94, "r_x2": 311.2, "r_y2": 632.14, "r_x3": 134.76, "r_y3": 632.14, "coord_origin": "TOPLEFT" }, "text": "predicted sequence is syntactically valid.", "orig": "predicted sequence is syntactically valid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The application of these rules gives OTSL a set of unique properties. First of all, the OTSL enforces a strictly rectangular structure representation, where every new-line token starts a new row. As a consequence, all rows and all columns have exactly the same number of tokens, irrespective of cell spans. Secondly, the OTSL representation is unambiguous: Every table structure is represented in one way. In this representation every table cell corresponds to a \"C\"-cell token, which in case of spans is always located in the top-left corner of the table cell definition. Third, OTSL syntax rules are only backward-looking. As a consequence, every predicted token can be validated straight during sequence generation by looking at the previously predicted sequence. As such, OTSL can guarantee that every predicted sequence is syntactically valid." }, { "label": "text", "id": 2, "page_no": 6, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 644.1, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 149.71, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "These characteristics can be easily learned by sequence generator networks,", "orig": "These characteristics can be easily learned by sequence generator networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "as we demonstrate further below. We find strong indications that this pattern", "orig": "as we demonstrate further below. We find strong indications that this pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "These characteristics can be easily learned by sequence generator networks, as we demonstrate further below. We find strong indications that this pattern" } ], "headers": [ { "label": "page_header", "id": 7, "page_no": 6, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.933, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 11, "page_no": 6, "cluster": { "id": 11, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.875, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7" } ] } }, { "page_no": 7, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 163.56, "r_y1": 139.69, "r_x2": 163.56, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 170.36, "r_x1": 149.4, "r_y1": 170.36, "r_x2": 149.4, "r_y2": 161.56, "r_x3": 134.76, "r_y3": 161.56, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 170.36, "r_x1": 319.35, "r_y1": 170.36, "r_x2": 319.35, "r_y2": 161.56, "r_x3": 160.86, "r_y3": 161.56, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 191.08, "r_x1": 480.6, "r_y1": 191.08, "r_x2": 480.6, "r_y2": 182.28, "r_x3": 134.76, "r_y3": 182.28, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 203.03, "r_x1": 480.59, "r_y1": 203.03, "r_x2": 480.59, "r_y2": 194.24, "r_x3": 134.76, "r_y3": 194.24, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 214.99, "r_x1": 480.59, "r_y1": 214.99, "r_x2": 480.59, "r_y2": 206.19, "r_x3": 134.76, "r_y3": 206.19, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 226.94, "r_x1": 480.59, "r_y1": 226.94, "r_x2": 480.59, "r_y2": 218.15, "r_x3": 134.76, "r_y3": 218.15, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 238.9, "r_x1": 480.59, "r_y1": 238.9, "r_x2": 480.59, "r_y2": 230.1, "r_x3": 134.76, "r_y3": 230.1, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 250.85, "r_x1": 480.59, "r_y1": 250.85, "r_x2": 480.59, "r_y2": 242.06, "r_x3": 134.76, "r_y3": 242.06, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 262.81, "r_x1": 480.59, "r_y1": 262.81, "r_x2": 480.59, "r_y2": 254.01, "r_x3": 134.76, "r_y3": 254.01, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 274.77, "r_x1": 480.59, "r_y1": 274.77, "r_x2": 480.59, "r_y2": 265.97, "r_x3": 134.76, "r_y3": 265.97, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 286.72, "r_x1": 480.6, "r_y1": 286.72, "r_x2": 480.6, "r_y2": 277.92, "r_x3": 134.76, "r_y3": 277.92, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 298.68, "r_x1": 469.4, "r_y1": 298.68, "r_x2": 469.4, "r_y2": 289.88, "r_x3": 134.76, "r_y3": 289.88, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.73, "r_x1": 141.49, "r_y1": 331.73, "r_x2": 141.49, "r_y2": 321.16, "r_x3": 134.76, "r_y3": 321.16, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 331.73, "r_x1": 229.04, "r_y1": 331.73, "r_x2": 229.04, "r_y2": 321.16, "r_x3": 154.94, "r_y3": 321.16, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 356.05, "r_x1": 480.59, "r_y1": 356.05, "r_x2": 480.59, "r_y2": 347.25, "r_x3": 134.76, "r_y3": 347.25, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 368.0, "r_x1": 480.59, "r_y1": 368.0, "r_x2": 480.59, "r_y2": 359.2, "r_x3": 134.76, "r_y3": 359.2, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.96, "r_x1": 480.59, "r_y1": 379.96, "r_x2": 480.59, "r_y2": 371.16, "r_x3": 134.76, "r_y3": 371.16, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.91, "r_x1": 480.59, "r_y1": 391.91, "r_x2": 480.59, "r_y2": 383.11, "r_x3": 134.76, "r_y3": 383.11, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 403.87, "r_x1": 148.6, "r_y1": 403.87, "r_x2": 148.6, "r_y2": 395.07, "r_x3": 134.76, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.63, "r_y0": 403.87, "r_x1": 191.85, "r_y1": 403.87, "r_x2": 191.85, "r_y2": 395.07, "r_x3": 151.63, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 403.87, "r_x1": 480.6, "r_y1": 403.87, "r_x2": 480.6, "r_y2": 395.07, "r_x3": 195.9, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 415.82, "r_x1": 480.59, "r_y1": 415.82, "r_x2": 480.59, "r_y2": 407.02, "r_x3": 134.77, "r_y3": 407.02, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 427.78, "r_x1": 480.59, "r_y1": 427.78, "r_x2": 480.59, "r_y2": 418.98, "r_x3": 134.77, "r_y3": 418.98, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 439.73, "r_x1": 480.59, "r_y1": 439.73, "r_x2": 480.59, "r_y2": 430.94, "r_x3": 134.77, "r_y3": 430.94, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 451.69, "r_x1": 479.3, "r_y1": 451.69, "r_x2": 479.3, "r_y2": 442.89, "r_x3": 134.77, "r_y3": 442.89, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 492.57, "r_x1": 162.64, "r_y1": 492.57, "r_x2": 162.64, "r_y2": 484.65, "r_x3": 134.77, "r_y3": 484.65, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 492.78, "r_x1": 480.59, "r_y1": 492.78, "r_x2": 480.59, "r_y2": 484.71, "r_x3": 165.2, "r_y3": 484.71, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 503.74, "r_x1": 206.7, "r_y1": 503.74, "r_x2": 206.7, "r_y2": 495.67, "r_x3": 134.77, "r_y3": 495.67, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.71, "r_y1": 543.1, "r_x2": 149.71, "r_y2": 540.73, "r_x3": 147.3, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 543.1, "r_x1": 155.72, "r_y1": 543.1, "r_x2": 155.72, "r_y2": 540.73, "r_x3": 150.91, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.76, "r_y0": 537.76, "r_x1": 172.3, "r_y1": 537.76, "r_x2": 172.3, "r_y2": 535.39, "r_x3": 162.76, "r_y3": 535.39, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.64, "r_y0": 537.73, "r_x1": 155.92, "r_y1": 537.73, "r_x2": 155.92, "r_y2": 535.37, "r_x3": 147.64, "r_y3": 535.37, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.73, "r_x3": 158.48, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 547.04, "r_x1": 162.7, "r_y1": 547.04, "r_x2": 162.7, "r_y2": 544.67, "r_x3": 158.48, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 551.28, "r_x1": 164.1, "r_y1": 551.28, "r_x2": 164.1, "r_y2": 548.91, "r_x3": 158.48, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 555.52, "r_x1": 162.7, "r_y1": 555.52, "r_x2": 162.7, "r_y2": 553.15, "r_x3": 158.48, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 543.1, "r_x1": 172.89, "r_y1": 543.1, "r_x2": 172.89, "r_y2": 540.73, "r_x3": 168.82, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 547.04, "r_x1": 172.89, "r_y1": 547.04, "r_x2": 172.89, "r_y2": 544.67, "r_x3": 168.82, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 551.28, "r_x1": 172.89, "r_y1": 551.28, "r_x2": 172.89, "r_y2": 548.91, "r_x3": 168.82, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 555.52, "r_x1": 172.89, "r_y1": 555.52, "r_x2": 172.89, "r_y2": 553.15, "r_x3": 168.82, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.04, "r_x1": 149.71, "r_y1": 547.04, "r_x2": 149.71, "r_y2": 544.67, "r_x3": 147.3, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 547.04, "r_x1": 155.72, "r_y1": 547.04, "r_x2": 155.72, "r_y2": 544.67, "r_x3": 150.91, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.28, "r_x1": 149.71, "r_y1": 551.28, "r_x2": 149.71, "r_y2": 548.91, "r_x3": 147.3, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 551.28, "r_x1": 155.72, "r_y1": 551.28, "r_x2": 155.72, "r_y2": 548.91, "r_x3": 150.91, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.52, "r_x1": 149.71, "r_y1": 555.52, "r_x2": 149.71, "r_y2": 553.15, "r_x3": 147.3, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 555.52, "r_x1": 155.72, "r_y1": 555.52, "r_x2": 155.72, "r_y2": 553.15, "r_x3": 150.91, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05, "r_y0": 521.27, "r_x1": 171.25, "r_y1": 521.27, "r_x2": 171.25, "r_y2": 517.01, "r_x3": 152.05, "r_y3": 517.01, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13, "r_y0": 526.58, "r_x1": 175.17, "r_y1": 526.58, "r_x2": 175.17, "r_y2": 522.31, "r_x3": 148.13, "r_y3": 522.31, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53, "r_y0": 528.78, "r_x1": 220.32, "r_y1": 528.78, "r_x2": 220.32, "r_y2": 524.51, "r_x3": 193.53, "r_y3": 524.51, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47, "r_y0": 534.08, "r_x1": 214.38, "r_y1": 534.08, "r_x2": 214.38, "r_y2": 529.82, "r_x3": 199.47, "r_y3": 529.82, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61, "r_y0": 514.17, "r_x1": 284.47, "r_y1": 514.17, "r_x2": 284.47, "r_y2": 509.91, "r_x3": 273.61, "r_y3": 509.91, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 517.96, "r_x1": 287.63, "r_y1": 517.96, "r_x2": 287.63, "r_y2": 513.69, "r_x3": 270.45, "r_y3": 513.69, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.48, "r_y0": 512.41, "r_x1": 348.14, "r_y1": 512.41, "r_x2": 348.14, "r_y2": 508.14, "r_x3": 332.48, "r_y3": 508.14, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.69, "r_y0": 525.38, "r_x1": 407.25, "r_y1": 525.38, "r_x2": 407.25, "r_y2": 521.12, "r_x3": 376.69, "r_y3": 521.12, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.91, "r_y0": 529.93, "r_x1": 410.04, "r_y1": 529.93, "r_x2": 410.04, "r_y2": 525.67, "r_x3": 373.91, "r_y3": 525.67, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.47, "r_x1": 408.65, "r_y1": 534.47, "r_x2": 408.65, "r_y2": 530.21, "r_x3": 375.3, "r_y3": 530.21, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.07, "r_y0": 539.02, "r_x1": 406.88, "r_y1": 539.02, "r_x2": 406.88, "r_y2": 534.76, "r_x3": 377.07, "r_y3": 534.76, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.57, "r_y0": 567.5, "r_x1": 433.77, "r_y1": 567.5, "r_x2": 433.77, "r_y2": 563.24, "r_x3": 383.57, "r_y3": 563.24, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.53, "r_y0": 572.05, "r_x1": 433.81, "r_y1": 572.05, "r_x2": 433.81, "r_y2": 567.79, "r_x3": 383.53, "r_y3": 567.79, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.48, "r_y0": 576.59, "r_x1": 426.86, "r_y1": 576.59, "r_x2": 426.86, "r_y2": 572.33, "r_x3": 390.48, "r_y3": 572.33, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 582.15, "r_x1": 323.17, "r_y1": 582.15, "r_x2": 323.17, "r_y2": 577.89, "r_x3": 293.95, "r_y3": 577.89, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 586.7, "r_x1": 324.59, "r_y1": 586.7, "r_x2": 324.59, "r_y2": 582.44, "r_x3": 293.95, "r_y3": 582.44, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 546.09, "r_x1": 364.15, "r_y1": 546.09, "r_x2": 364.15, "r_y2": 541.82, "r_x3": 333.08, "r_y3": 541.82, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 549.87, "r_x1": 369.72, "r_y1": 549.87, "r_x2": 369.72, "r_y2": 545.61, "r_x3": 333.08, "r_y3": 545.61, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.66, "r_y0": 519.5, "r_x1": 249.59, "r_y1": 519.5, "r_x2": 249.59, "r_y2": 515.24, "r_x3": 232.66, "r_y3": 515.24, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.82, "r_y0": 550.23, "r_x1": 288.26, "r_y1": 550.23, "r_x2": 288.26, "r_y2": 545.97, "r_x3": 269.82, "r_y3": 545.97, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 554.02, "r_x1": 287.63, "r_y1": 554.02, "r_x2": 287.63, "r_y2": 549.76, "r_x3": 270.45, "r_y3": 549.76, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 520.18, "r_x1": 358.11, "r_y1": 520.18, "r_x2": 358.11, "r_y2": 515.91, "r_x3": 332.18, "r_y3": 515.91, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 526.24, "r_x1": 361.58, "r_y1": 526.24, "r_x2": 361.58, "r_y2": 521.97, "r_x3": 332.18, "r_y3": 521.97, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 532.3, "r_x1": 364.76, "r_y1": 532.3, "r_x2": 364.76, "r_y2": 528.03, "r_x3": 332.18, "r_y3": 528.03, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 538.36, "r_x1": 335.97, "r_y1": 538.36, "r_x2": 335.97, "r_y2": 534.09, "r_x3": 332.18, "r_y3": 534.09, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.89, "r_y0": 520.66, "r_x1": 329.42, "r_y1": 520.66, "r_x2": 329.42, "r_y2": 516.4, "r_x3": 326.89, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 526.69, "r_x1": 329.57, "r_y1": 526.69, "r_x2": 329.57, "r_y2": 522.42, "r_x3": 327.04, "r_y3": 522.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 532.78, "r_x1": 329.57, "r_y1": 532.78, "r_x2": 329.57, "r_y2": 528.52, "r_x3": 327.04, "r_y3": 528.52, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14, "r_y0": 531.71, "r_x1": 426.67, "r_y1": 531.71, "r_x2": 426.67, "r_y2": 527.44, "r_x3": 424.14, "r_y3": 527.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.72, "r_x1": 455.53, "r_y1": 521.72, "r_x2": 455.53, "r_y2": 517.45, "r_x3": 453.0, "r_y3": 517.45, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.86, "r_y0": 521.33, "r_x1": 426.39, "r_y1": 521.33, "r_x2": 426.39, "r_y2": 517.06, "r_x3": 423.86, "r_y3": 517.06, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 562.36, "r_x1": 337.28, "r_y1": 562.36, "r_x2": 337.28, "r_y2": 557.37, "r_x3": 333.43, "r_y3": 557.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35, "r_y0": 562.31, "r_x1": 344.2, "r_y1": 562.31, "r_x2": 344.2, "r_y2": 557.32, "r_x3": 340.35, "r_y3": 557.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.31, "r_y0": 568.86, "r_x1": 344.15, "r_y1": 568.86, "r_x2": 344.15, "r_y2": 563.87, "r_x3": 340.31, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.86, "r_x1": 350.64, "r_y1": 568.86, "r_x2": 350.64, "r_y2": 563.87, "r_x3": 346.8, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.81, "r_x1": 337.44, "r_y1": 568.81, "r_x2": 337.44, "r_y2": 563.82, "r_x3": 333.6, "r_y3": 563.82, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 575.42, "r_x1": 344.22, "r_y1": 575.42, "r_x2": 344.22, "r_y2": 570.43, "r_x3": 340.38, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86, "r_y0": 575.42, "r_x1": 350.71, "r_y1": 575.42, "r_x2": 350.71, "r_y2": 570.43, "r_x3": 346.86, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 575.37, "r_x1": 337.5, "r_y1": 575.37, "r_x2": 337.5, "r_y2": 570.38, "r_x3": 333.66, "r_y3": 570.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 582.02, "r_x1": 344.22, "r_y1": 582.02, "r_x2": 344.22, "r_y2": 577.03, "r_x3": 340.38, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.87, "r_y0": 582.02, "r_x1": 350.71, "r_y1": 582.02, "r_x2": 350.71, "r_y2": 577.03, "r_x3": 346.87, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 581.97, "r_x1": 337.5, "r_y1": 581.97, "r_x2": 337.5, "r_y2": 576.98, "r_x3": 333.66, "r_y3": 576.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.28, "r_y0": 588.39, "r_x1": 344.12, "r_y1": 588.39, "r_x2": 344.12, "r_y2": 583.4, "r_x3": 340.28, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.77, "r_y0": 588.39, "r_x1": 350.61, "r_y1": 588.39, "r_x2": 350.61, "r_y2": 583.4, "r_x3": 346.77, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.57, "r_y0": 588.35, "r_x1": 337.41, "r_y1": 588.35, "r_x2": 337.41, "r_y2": 583.35, "r_x3": 333.57, "r_y3": 583.35, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03, "r_y0": 561.87, "r_x1": 359.83, "r_y1": 561.87, "r_x2": 359.83, "r_y2": 556.88, "r_x3": 353.03, "r_y3": 556.88, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19, "r_y0": 568.57, "r_x1": 359.99, "r_y1": 568.57, "r_x2": 359.99, "r_y2": 563.58, "r_x3": 353.19, "r_y3": 563.58, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.15, "r_x1": 360.0, "r_y1": 575.15, "r_x2": 360.0, "r_y2": 570.16, "r_x3": 353.2, "r_y3": 570.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.15, "r_y0": 581.76, "r_x1": 359.95, "r_y1": 581.76, "r_x2": 359.95, "r_y2": 576.77, "r_x3": 353.15, "r_y3": 576.77, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.27, "r_y0": 588.4, "r_x1": 360.07, "r_y1": 588.4, "r_x2": 360.07, "r_y2": 583.41, "r_x3": 353.27, "r_y3": 583.41, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.38, "r_y0": 562.07, "r_x1": 350.34, "r_y1": 562.07, "r_x2": 350.34, "r_y2": 557.08, "r_x3": 347.38, "r_y3": 557.08, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14, "r_y0": 568.55, "r_x1": 333.67, "r_y1": 568.55, "r_x2": 333.67, "r_y2": 564.29, "r_x3": 331.14, "r_y3": 564.29, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.81, "r_y0": 558.86, "r_x1": 343.34, "r_y1": 558.86, "r_x2": 343.34, "r_y2": 554.59, "r_x3": 340.81, "r_y3": 554.59, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.98, "r_y0": 559.09, "r_x1": 333.51, "r_y1": 559.09, "r_x2": 333.51, "r_y2": 554.83, "r_x3": 330.98, "r_y3": 554.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 149.71, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 9, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.83, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.863, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 139.69, "coord_origin": "TOPLEFT" }, "confidence": 0.946, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 163.56, "r_y1": 139.69, "r_x2": 163.56, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "section_header", "bbox": { "l": 134.76, "t": 161.56, "r": 319.35, "b": 170.36, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 170.36, "r_x1": 149.4, "r_y1": 170.36, "r_x2": 149.4, "r_y2": 161.56, "r_x3": 134.76, "r_y3": 161.56, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 170.36, "r_x1": 319.35, "r_y1": 170.36, "r_x2": 319.35, "r_y2": 161.56, "r_x3": 160.86, "r_y3": 161.56, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 182.28, "r": 480.6, "b": 298.68, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 191.08, "r_x1": 480.6, "r_y1": 191.08, "r_x2": 480.6, "r_y2": 182.28, "r_x3": 134.76, "r_y3": 182.28, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 203.03, "r_x1": 480.59, "r_y1": 203.03, "r_x2": 480.59, "r_y2": 194.24, "r_x3": 134.76, "r_y3": 194.24, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 214.99, "r_x1": 480.59, "r_y1": 214.99, "r_x2": 480.59, "r_y2": 206.19, "r_x3": 134.76, "r_y3": 206.19, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 226.94, "r_x1": 480.59, "r_y1": 226.94, "r_x2": 480.59, "r_y2": 218.15, "r_x3": 134.76, "r_y3": 218.15, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 238.9, "r_x1": 480.59, "r_y1": 238.9, "r_x2": 480.59, "r_y2": 230.1, "r_x3": 134.76, "r_y3": 230.1, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 250.85, "r_x1": 480.59, "r_y1": 250.85, "r_x2": 480.59, "r_y2": 242.06, "r_x3": 134.76, "r_y3": 242.06, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 262.81, "r_x1": 480.59, "r_y1": 262.81, "r_x2": 480.59, "r_y2": 254.01, "r_x3": 134.76, "r_y3": 254.01, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 274.77, "r_x1": 480.59, "r_y1": 274.77, "r_x2": 480.59, "r_y2": 265.97, "r_x3": 134.76, "r_y3": 265.97, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 286.72, "r_x1": 480.6, "r_y1": 286.72, "r_x2": 480.6, "r_y2": 277.92, "r_x3": 134.76, "r_y3": 277.92, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 298.68, "r_x1": 469.4, "r_y1": 298.68, "r_x2": 469.4, "r_y2": 289.88, "r_x3": 134.76, "r_y3": 289.88, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.76, "t": 321.16, "r": 229.04, "b": 331.73, "coord_origin": "TOPLEFT" }, "confidence": 0.952, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.73, "r_x1": 141.49, "r_y1": 331.73, "r_x2": 141.49, "r_y2": 321.16, "r_x3": 134.76, "r_y3": 321.16, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 331.73, "r_x1": 229.04, "r_y1": 331.73, "r_x2": 229.04, "r_y2": 321.16, "r_x3": 154.94, "r_y3": 321.16, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 347.25, "r": 480.6, "b": 451.69, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 356.05, "r_x1": 480.59, "r_y1": 356.05, "r_x2": 480.59, "r_y2": 347.25, "r_x3": 134.76, "r_y3": 347.25, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 368.0, "r_x1": 480.59, "r_y1": 368.0, "r_x2": 480.59, "r_y2": 359.2, "r_x3": 134.76, "r_y3": 359.2, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.96, "r_x1": 480.59, "r_y1": 379.96, "r_x2": 480.59, "r_y2": 371.16, "r_x3": 134.76, "r_y3": 371.16, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.91, "r_x1": 480.59, "r_y1": 391.91, "r_x2": 480.59, "r_y2": 383.11, "r_x3": 134.76, "r_y3": 383.11, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 403.87, "r_x1": 148.6, "r_y1": 403.87, "r_x2": 148.6, "r_y2": 395.07, "r_x3": 134.76, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.63, "r_y0": 403.87, "r_x1": 191.85, "r_y1": 403.87, "r_x2": 191.85, "r_y2": 395.07, "r_x3": 151.63, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 403.87, "r_x1": 480.6, "r_y1": 403.87, "r_x2": 480.6, "r_y2": 395.07, "r_x3": 195.9, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 415.82, "r_x1": 480.59, "r_y1": 415.82, "r_x2": 480.59, "r_y2": 407.02, "r_x3": 134.77, "r_y3": 407.02, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 427.78, "r_x1": 480.59, "r_y1": 427.78, "r_x2": 480.59, "r_y2": 418.98, "r_x3": 134.77, "r_y3": 418.98, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 439.73, "r_x1": 480.59, "r_y1": 439.73, "r_x2": 480.59, "r_y2": 430.94, "r_x3": 134.77, "r_y3": 430.94, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 451.69, "r_x1": 479.3, "r_y1": 451.69, "r_x2": 479.3, "r_y2": 442.89, "r_x3": 134.77, "r_y3": 442.89, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "caption", "bbox": { "l": 134.77, "t": 484.65, "r": 480.59, "b": 503.74, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 492.57, "r_x1": 162.64, "r_y1": 492.57, "r_x2": 162.64, "r_y2": 484.65, "r_x3": 134.77, "r_y3": 484.65, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 492.78, "r_x1": 480.59, "r_y1": 492.78, "r_x2": 480.59, "r_y2": 484.71, "r_x3": 165.2, "r_y3": 484.71, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 503.74, "r_x1": 206.7, "r_y1": 503.74, "r_x2": 206.7, "r_y2": 495.67, "r_x3": 134.77, "r_y3": 495.67, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "picture", "bbox": { "l": 140.71, "t": 508.06, "r": 472.73, "b": 593.68, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.71, "r_y1": 543.1, "r_x2": 149.71, "r_y2": 540.73, "r_x3": 147.3, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 543.1, "r_x1": 155.72, "r_y1": 543.1, "r_x2": 155.72, "r_y2": 540.73, "r_x3": 150.91, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.76, "r_y0": 537.76, "r_x1": 172.3, "r_y1": 537.76, "r_x2": 172.3, "r_y2": 535.39, "r_x3": 162.76, "r_y3": 535.39, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.64, "r_y0": 537.73, "r_x1": 155.92, "r_y1": 537.73, "r_x2": 155.92, "r_y2": 535.37, "r_x3": 147.64, "r_y3": 535.37, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.73, "r_x3": 158.48, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 547.04, "r_x1": 162.7, "r_y1": 547.04, "r_x2": 162.7, "r_y2": 544.67, "r_x3": 158.48, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 551.28, "r_x1": 164.1, "r_y1": 551.28, "r_x2": 164.1, "r_y2": 548.91, "r_x3": 158.48, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 555.52, "r_x1": 162.7, "r_y1": 555.52, "r_x2": 162.7, "r_y2": 553.15, "r_x3": 158.48, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 543.1, "r_x1": 172.89, "r_y1": 543.1, "r_x2": 172.89, "r_y2": 540.73, "r_x3": 168.82, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 547.04, "r_x1": 172.89, "r_y1": 547.04, "r_x2": 172.89, "r_y2": 544.67, "r_x3": 168.82, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 551.28, "r_x1": 172.89, "r_y1": 551.28, "r_x2": 172.89, "r_y2": 548.91, "r_x3": 168.82, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 555.52, "r_x1": 172.89, "r_y1": 555.52, "r_x2": 172.89, "r_y2": 553.15, "r_x3": 168.82, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.04, "r_x1": 149.71, "r_y1": 547.04, "r_x2": 149.71, "r_y2": 544.67, "r_x3": 147.3, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 547.04, "r_x1": 155.72, "r_y1": 547.04, "r_x2": 155.72, "r_y2": 544.67, "r_x3": 150.91, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.28, "r_x1": 149.71, "r_y1": 551.28, "r_x2": 149.71, "r_y2": 548.91, "r_x3": 147.3, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 551.28, "r_x1": 155.72, "r_y1": 551.28, "r_x2": 155.72, "r_y2": 548.91, "r_x3": 150.91, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.52, "r_x1": 149.71, "r_y1": 555.52, "r_x2": 149.71, "r_y2": 553.15, "r_x3": 147.3, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 555.52, "r_x1": 155.72, "r_y1": 555.52, "r_x2": 155.72, "r_y2": 553.15, "r_x3": 150.91, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05, "r_y0": 521.27, "r_x1": 171.25, "r_y1": 521.27, "r_x2": 171.25, "r_y2": 517.01, "r_x3": 152.05, "r_y3": 517.01, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13, "r_y0": 526.58, "r_x1": 175.17, "r_y1": 526.58, "r_x2": 175.17, "r_y2": 522.31, "r_x3": 148.13, "r_y3": 522.31, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53, "r_y0": 528.78, "r_x1": 220.32, "r_y1": 528.78, "r_x2": 220.32, "r_y2": 524.51, "r_x3": 193.53, "r_y3": 524.51, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47, "r_y0": 534.08, "r_x1": 214.38, "r_y1": 534.08, "r_x2": 214.38, "r_y2": 529.82, "r_x3": 199.47, "r_y3": 529.82, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61, "r_y0": 514.17, "r_x1": 284.47, "r_y1": 514.17, "r_x2": 284.47, "r_y2": 509.91, "r_x3": 273.61, "r_y3": 509.91, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 517.96, "r_x1": 287.63, "r_y1": 517.96, "r_x2": 287.63, "r_y2": 513.69, "r_x3": 270.45, "r_y3": 513.69, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.48, "r_y0": 512.41, "r_x1": 348.14, "r_y1": 512.41, "r_x2": 348.14, "r_y2": 508.14, "r_x3": 332.48, "r_y3": 508.14, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.69, "r_y0": 525.38, "r_x1": 407.25, "r_y1": 525.38, "r_x2": 407.25, "r_y2": 521.12, "r_x3": 376.69, "r_y3": 521.12, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.91, "r_y0": 529.93, "r_x1": 410.04, "r_y1": 529.93, "r_x2": 410.04, "r_y2": 525.67, "r_x3": 373.91, "r_y3": 525.67, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.47, "r_x1": 408.65, "r_y1": 534.47, "r_x2": 408.65, "r_y2": 530.21, "r_x3": 375.3, "r_y3": 530.21, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.07, "r_y0": 539.02, "r_x1": 406.88, "r_y1": 539.02, "r_x2": 406.88, "r_y2": 534.76, "r_x3": 377.07, "r_y3": 534.76, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.57, "r_y0": 567.5, "r_x1": 433.77, "r_y1": 567.5, "r_x2": 433.77, "r_y2": 563.24, "r_x3": 383.57, "r_y3": 563.24, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.53, "r_y0": 572.05, "r_x1": 433.81, "r_y1": 572.05, "r_x2": 433.81, "r_y2": 567.79, "r_x3": 383.53, "r_y3": 567.79, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.48, "r_y0": 576.59, "r_x1": 426.86, "r_y1": 576.59, "r_x2": 426.86, "r_y2": 572.33, "r_x3": 390.48, "r_y3": 572.33, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 582.15, "r_x1": 323.17, "r_y1": 582.15, "r_x2": 323.17, "r_y2": 577.89, "r_x3": 293.95, "r_y3": 577.89, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 586.7, "r_x1": 324.59, "r_y1": 586.7, "r_x2": 324.59, "r_y2": 582.44, "r_x3": 293.95, "r_y3": 582.44, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 546.09, "r_x1": 364.15, "r_y1": 546.09, "r_x2": 364.15, "r_y2": 541.82, "r_x3": 333.08, "r_y3": 541.82, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 549.87, "r_x1": 369.72, "r_y1": 549.87, "r_x2": 369.72, "r_y2": 545.61, "r_x3": 333.08, "r_y3": 545.61, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.66, "r_y0": 519.5, "r_x1": 249.59, "r_y1": 519.5, "r_x2": 249.59, "r_y2": 515.24, "r_x3": 232.66, "r_y3": 515.24, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.82, "r_y0": 550.23, "r_x1": 288.26, "r_y1": 550.23, "r_x2": 288.26, "r_y2": 545.97, "r_x3": 269.82, "r_y3": 545.97, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 554.02, "r_x1": 287.63, "r_y1": 554.02, "r_x2": 287.63, "r_y2": 549.76, "r_x3": 270.45, "r_y3": 549.76, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 520.18, "r_x1": 358.11, "r_y1": 520.18, "r_x2": 358.11, "r_y2": 515.91, "r_x3": 332.18, "r_y3": 515.91, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 526.24, "r_x1": 361.58, "r_y1": 526.24, "r_x2": 361.58, "r_y2": 521.97, "r_x3": 332.18, "r_y3": 521.97, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 532.3, "r_x1": 364.76, "r_y1": 532.3, "r_x2": 364.76, "r_y2": 528.03, "r_x3": 332.18, "r_y3": 528.03, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 538.36, "r_x1": 335.97, "r_y1": 538.36, "r_x2": 335.97, "r_y2": 534.09, "r_x3": 332.18, "r_y3": 534.09, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.89, "r_y0": 520.66, "r_x1": 329.42, "r_y1": 520.66, "r_x2": 329.42, "r_y2": 516.4, "r_x3": 326.89, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 526.69, "r_x1": 329.57, "r_y1": 526.69, "r_x2": 329.57, "r_y2": 522.42, "r_x3": 327.04, "r_y3": 522.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 532.78, "r_x1": 329.57, "r_y1": 532.78, "r_x2": 329.57, "r_y2": 528.52, "r_x3": 327.04, "r_y3": 528.52, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14, "r_y0": 531.71, "r_x1": 426.67, "r_y1": 531.71, "r_x2": 426.67, "r_y2": 527.44, "r_x3": 424.14, "r_y3": 527.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.72, "r_x1": 455.53, "r_y1": 521.72, "r_x2": 455.53, "r_y2": 517.45, "r_x3": 453.0, "r_y3": 517.45, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.86, "r_y0": 521.33, "r_x1": 426.39, "r_y1": 521.33, "r_x2": 426.39, "r_y2": 517.06, "r_x3": 423.86, "r_y3": 517.06, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 562.36, "r_x1": 337.28, "r_y1": 562.36, "r_x2": 337.28, "r_y2": 557.37, "r_x3": 333.43, "r_y3": 557.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35, "r_y0": 562.31, "r_x1": 344.2, "r_y1": 562.31, "r_x2": 344.2, "r_y2": 557.32, "r_x3": 340.35, "r_y3": 557.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.31, "r_y0": 568.86, "r_x1": 344.15, "r_y1": 568.86, "r_x2": 344.15, "r_y2": 563.87, "r_x3": 340.31, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.86, "r_x1": 350.64, "r_y1": 568.86, "r_x2": 350.64, "r_y2": 563.87, "r_x3": 346.8, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.81, "r_x1": 337.44, "r_y1": 568.81, "r_x2": 337.44, "r_y2": 563.82, "r_x3": 333.6, "r_y3": 563.82, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 575.42, "r_x1": 344.22, "r_y1": 575.42, "r_x2": 344.22, "r_y2": 570.43, "r_x3": 340.38, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86, "r_y0": 575.42, "r_x1": 350.71, "r_y1": 575.42, "r_x2": 350.71, "r_y2": 570.43, "r_x3": 346.86, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 575.37, "r_x1": 337.5, "r_y1": 575.37, "r_x2": 337.5, "r_y2": 570.38, "r_x3": 333.66, "r_y3": 570.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 582.02, "r_x1": 344.22, "r_y1": 582.02, "r_x2": 344.22, "r_y2": 577.03, "r_x3": 340.38, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.87, "r_y0": 582.02, "r_x1": 350.71, "r_y1": 582.02, "r_x2": 350.71, "r_y2": 577.03, "r_x3": 346.87, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 581.97, "r_x1": 337.5, "r_y1": 581.97, "r_x2": 337.5, "r_y2": 576.98, "r_x3": 333.66, "r_y3": 576.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.28, "r_y0": 588.39, "r_x1": 344.12, "r_y1": 588.39, "r_x2": 344.12, "r_y2": 583.4, "r_x3": 340.28, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.77, "r_y0": 588.39, "r_x1": 350.61, "r_y1": 588.39, "r_x2": 350.61, "r_y2": 583.4, "r_x3": 346.77, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.57, "r_y0": 588.35, "r_x1": 337.41, "r_y1": 588.35, "r_x2": 337.41, "r_y2": 583.35, "r_x3": 333.57, "r_y3": 583.35, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03, "r_y0": 561.87, "r_x1": 359.83, "r_y1": 561.87, "r_x2": 359.83, "r_y2": 556.88, "r_x3": 353.03, "r_y3": 556.88, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19, "r_y0": 568.57, "r_x1": 359.99, "r_y1": 568.57, "r_x2": 359.99, "r_y2": 563.58, "r_x3": 353.19, "r_y3": 563.58, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.15, "r_x1": 360.0, "r_y1": 575.15, "r_x2": 360.0, "r_y2": 570.16, "r_x3": 353.2, "r_y3": 570.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.15, "r_y0": 581.76, "r_x1": 359.95, "r_y1": 581.76, "r_x2": 359.95, "r_y2": 576.77, "r_x3": 353.15, "r_y3": 576.77, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.27, "r_y0": 588.4, "r_x1": 360.07, "r_y1": 588.4, "r_x2": 360.07, "r_y2": 583.41, "r_x3": 353.27, "r_y3": 583.41, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.38, "r_y0": 562.07, "r_x1": 350.34, "r_y1": 562.07, "r_x2": 350.34, "r_y2": 557.08, "r_x3": 347.38, "r_y3": 557.08, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14, "r_y0": 568.55, "r_x1": 333.67, "r_y1": 568.55, "r_x2": 333.67, "r_y2": 564.29, "r_x3": 331.14, "r_y3": 564.29, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.81, "r_y0": 558.86, "r_x1": 343.34, "r_y1": 558.86, "r_x2": 343.34, "r_y2": 554.59, "r_x3": 340.81, "r_y3": 554.59, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.98, "r_y0": 559.09, "r_x1": 333.51, "r_y1": 559.09, "r_x2": 333.51, "r_y2": 554.83, "r_x3": 330.98, "r_y3": 554.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 13, "label": "text", "bbox": { "l": 147.3, "t": 540.73, "r": 149.71, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.71, "r_y1": 543.1, "r_x2": 149.71, "r_y2": 540.73, "r_x3": 147.3, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 150.91, "t": 540.73, "r": 155.72, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 543.1, "r_x1": 155.72, "r_y1": 543.1, "r_x2": 155.72, "r_y2": 540.73, "r_x3": 150.91, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 162.76, "t": 535.39, "r": 172.3, "b": 537.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.76, "r_y0": 537.76, "r_x1": 172.3, "r_y1": 537.76, "r_x2": 172.3, "r_y2": 535.39, "r_x3": 162.76, "r_y3": 535.39, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 147.64, "t": 535.37, "r": 155.92, "b": 537.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.64, "r_y0": 537.73, "r_x1": 155.92, "r_y1": 537.73, "r_x2": 155.92, "r_y2": 535.37, "r_x3": 147.64, "r_y3": 535.37, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 158.48, "t": 540.73, "r": 164.1, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.73, "r_x3": 158.48, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 158.48, "t": 544.67, "r": 162.7, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 547.04, "r_x1": 162.7, "r_y1": 547.04, "r_x2": 162.7, "r_y2": 544.67, "r_x3": 158.48, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 158.48, "t": 548.91, "r": 164.1, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 551.28, "r_x1": 164.1, "r_y1": 551.28, "r_x2": 164.1, "r_y2": 548.91, "r_x3": 158.48, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 158.48, "t": 553.15, "r": 162.7, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 555.52, "r_x1": 162.7, "r_y1": 555.52, "r_x2": 162.7, "r_y2": 553.15, "r_x3": 158.48, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 168.82, "t": 540.73, "r": 172.89, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 543.1, "r_x1": 172.89, "r_y1": 543.1, "r_x2": 172.89, "r_y2": 540.73, "r_x3": 168.82, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 168.82, "t": 544.67, "r": 172.89, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 547.04, "r_x1": 172.89, "r_y1": 547.04, "r_x2": 172.89, "r_y2": 544.67, "r_x3": 168.82, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 168.82, "t": 548.91, "r": 172.89, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 551.28, "r_x1": 172.89, "r_y1": 551.28, "r_x2": 172.89, "r_y2": 548.91, "r_x3": 168.82, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 168.82, "t": 553.15, "r": 172.89, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 555.52, "r_x1": 172.89, "r_y1": 555.52, "r_x2": 172.89, "r_y2": 553.15, "r_x3": 168.82, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 147.3, "t": 544.67, "r": 149.71, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.04, "r_x1": 149.71, "r_y1": 547.04, "r_x2": 149.71, "r_y2": 544.67, "r_x3": 147.3, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 150.91, "t": 544.67, "r": 155.72, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 547.04, "r_x1": 155.72, "r_y1": 547.04, "r_x2": 155.72, "r_y2": 544.67, "r_x3": 150.91, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 147.3, "t": 548.91, "r": 149.71, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.28, "r_x1": 149.71, "r_y1": 551.28, "r_x2": 149.71, "r_y2": 548.91, "r_x3": 147.3, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 150.91, "t": 548.91, "r": 155.72, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 551.28, "r_x1": 155.72, "r_y1": 551.28, "r_x2": 155.72, "r_y2": 548.91, "r_x3": 150.91, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 147.3, "t": 553.15, "r": 149.71, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.52, "r_x1": 149.71, "r_y1": 555.52, "r_x2": 149.71, "r_y2": 553.15, "r_x3": 147.3, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 150.91, "t": 553.15, "r": 155.72, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 555.52, "r_x1": 155.72, "r_y1": 555.52, "r_x2": 155.72, "r_y2": 553.15, "r_x3": 150.91, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 152.05, "t": 517.01, "r": 171.25, "b": 521.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05, "r_y0": 521.27, "r_x1": 171.25, "r_y1": 521.27, "r_x2": 171.25, "r_y2": 517.01, "r_x3": 152.05, "r_y3": 517.01, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 148.13, "t": 522.31, "r": 175.17, "b": 526.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13, "r_y0": 526.58, "r_x1": 175.17, "r_y1": 526.58, "r_x2": 175.17, "r_y2": 522.31, "r_x3": 148.13, "r_y3": 522.31, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 193.53, "t": 524.51, "r": 220.32, "b": 528.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53, "r_y0": 528.78, "r_x1": 220.32, "r_y1": 528.78, "r_x2": 220.32, "r_y2": 524.51, "r_x3": 193.53, "r_y3": 524.51, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 199.47, "t": 529.82, "r": 214.38, "b": 534.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47, "r_y0": 534.08, "r_x1": 214.38, "r_y1": 534.08, "r_x2": 214.38, "r_y2": 529.82, "r_x3": 199.47, "r_y3": 529.82, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 273.61, "t": 509.91, "r": 284.47, "b": 514.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61, "r_y0": 514.17, "r_x1": 284.47, "r_y1": 514.17, "r_x2": 284.47, "r_y2": 509.91, "r_x3": 273.61, "r_y3": 509.91, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 270.45, "t": 513.69, "r": 287.63, "b": 517.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 517.96, "r_x1": 287.63, "r_y1": 517.96, "r_x2": 287.63, "r_y2": 513.69, "r_x3": 270.45, "r_y3": 513.69, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 332.48, "t": 508.14, "r": 348.14, "b": 512.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.48, "r_y0": 512.41, "r_x1": 348.14, "r_y1": 512.41, "r_x2": 348.14, "r_y2": 508.14, "r_x3": 332.48, "r_y3": 508.14, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 376.69, "t": 521.12, "r": 407.25, "b": 525.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.69, "r_y0": 525.38, "r_x1": 407.25, "r_y1": 525.38, "r_x2": 407.25, "r_y2": 521.12, "r_x3": 376.69, "r_y3": 521.12, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 373.91, "t": 525.67, "r": 410.04, "b": 529.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.91, "r_y0": 529.93, "r_x1": 410.04, "r_y1": 529.93, "r_x2": 410.04, "r_y2": 525.67, "r_x3": 373.91, "r_y3": 525.67, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 375.3, "t": 530.21, "r": 408.65, "b": 534.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.47, "r_x1": 408.65, "r_y1": 534.47, "r_x2": 408.65, "r_y2": 530.21, "r_x3": 375.3, "r_y3": 530.21, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 377.07, "t": 534.76, "r": 406.88, "b": 539.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.07, "r_y0": 539.02, "r_x1": 406.88, "r_y1": 539.02, "r_x2": 406.88, "r_y2": 534.76, "r_x3": 377.07, "r_y3": 534.76, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 383.57, "t": 563.24, "r": 433.77, "b": 567.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.57, "r_y0": 567.5, "r_x1": 433.77, "r_y1": 567.5, "r_x2": 433.77, "r_y2": 563.24, "r_x3": 383.57, "r_y3": 563.24, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 383.53, "t": 567.79, "r": 433.81, "b": 572.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.53, "r_y0": 572.05, "r_x1": 433.81, "r_y1": 572.05, "r_x2": 433.81, "r_y2": 567.79, "r_x3": 383.53, "r_y3": 567.79, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 390.48, "t": 572.33, "r": 426.86, "b": 576.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.48, "r_y0": 576.59, "r_x1": 426.86, "r_y1": 576.59, "r_x2": 426.86, "r_y2": 572.33, "r_x3": 390.48, "r_y3": 572.33, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 293.95, "t": 577.89, "r": 323.17, "b": 582.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 582.15, "r_x1": 323.17, "r_y1": 582.15, "r_x2": 323.17, "r_y2": 577.89, "r_x3": 293.95, "r_y3": 577.89, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 293.95, "t": 582.44, "r": 324.59, "b": 586.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 586.7, "r_x1": 324.59, "r_y1": 586.7, "r_x2": 324.59, "r_y2": 582.44, "r_x3": 293.95, "r_y3": 582.44, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 333.08, "t": 541.82, "r": 364.15, "b": 546.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 546.09, "r_x1": 364.15, "r_y1": 546.09, "r_x2": 364.15, "r_y2": 541.82, "r_x3": 333.08, "r_y3": 541.82, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 333.08, "t": 545.61, "r": 369.72, "b": 549.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 549.87, "r_x1": 369.72, "r_y1": 549.87, "r_x2": 369.72, "r_y2": 545.61, "r_x3": 333.08, "r_y3": 545.61, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 232.66, "t": 515.24, "r": 249.59, "b": 519.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.66, "r_y0": 519.5, "r_x1": 249.59, "r_y1": 519.5, "r_x2": 249.59, "r_y2": 515.24, "r_x3": 232.66, "r_y3": 515.24, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 269.82, "t": 545.97, "r": 288.26, "b": 550.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.82, "r_y0": 550.23, "r_x1": 288.26, "r_y1": 550.23, "r_x2": 288.26, "r_y2": 545.97, "r_x3": 269.82, "r_y3": 545.97, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 270.45, "t": 549.76, "r": 287.63, "b": 554.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 554.02, "r_x1": 287.63, "r_y1": 554.02, "r_x2": 287.63, "r_y2": 549.76, "r_x3": 270.45, "r_y3": 549.76, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 332.18, "t": 515.91, "r": 358.11, "b": 520.18, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 520.18, "r_x1": 358.11, "r_y1": 520.18, "r_x2": 358.11, "r_y2": 515.91, "r_x3": 332.18, "r_y3": 515.91, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 332.18, "t": 521.97, "r": 361.58, "b": 526.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 526.24, "r_x1": 361.58, "r_y1": 526.24, "r_x2": 361.58, "r_y2": 521.97, "r_x3": 332.18, "r_y3": 521.97, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 332.18, "t": 528.03, "r": 364.76, "b": 532.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 532.3, "r_x1": 364.76, "r_y1": 532.3, "r_x2": 364.76, "r_y2": 528.03, "r_x3": 332.18, "r_y3": 528.03, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 332.18, "t": 534.09, "r": 335.97, "b": 538.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 538.36, "r_x1": 335.97, "r_y1": 538.36, "r_x2": 335.97, "r_y2": 534.09, "r_x3": 332.18, "r_y3": 534.09, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.89, "t": 516.4, "r": 329.42, "b": 520.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.89, "r_y0": 520.66, "r_x1": 329.42, "r_y1": 520.66, "r_x2": 329.42, "r_y2": 516.4, "r_x3": 326.89, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 327.04, "t": 522.42, "r": 329.57, "b": 526.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 526.69, "r_x1": 329.57, "r_y1": 526.69, "r_x2": 329.57, "r_y2": 522.42, "r_x3": 327.04, "r_y3": 522.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 327.04, "t": 528.52, "r": 329.57, "b": 532.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 532.78, "r_x1": 329.57, "r_y1": 532.78, "r_x2": 329.57, "r_y2": 528.52, "r_x3": 327.04, "r_y3": 528.52, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 424.14, "t": 527.44, "r": 426.67, "b": 531.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14, "r_y0": 531.71, "r_x1": 426.67, "r_y1": 531.71, "r_x2": 426.67, "r_y2": 527.44, "r_x3": 424.14, "r_y3": 527.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 453.0, "t": 517.45, "r": 455.53, "b": 521.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.72, "r_x1": 455.53, "r_y1": 521.72, "r_x2": 455.53, "r_y2": 517.45, "r_x3": 453.0, "r_y3": 517.45, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 423.86, "t": 517.06, "r": 426.39, "b": 521.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.86, "r_y0": 521.33, "r_x1": 426.39, "r_y1": 521.33, "r_x2": 426.39, "r_y2": 517.06, "r_x3": 423.86, "r_y3": 517.06, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 333.43, "t": 557.37, "r": 337.28, "b": 562.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 562.36, "r_x1": 337.28, "r_y1": 562.36, "r_x2": 337.28, "r_y2": 557.37, "r_x3": 333.43, "r_y3": 557.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 340.35, "t": 557.32, "r": 344.2, "b": 562.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35, "r_y0": 562.31, "r_x1": 344.2, "r_y1": 562.31, "r_x2": 344.2, "r_y2": 557.32, "r_x3": 340.35, "r_y3": 557.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 340.31, "t": 563.87, "r": 344.15, "b": 568.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.31, "r_y0": 568.86, "r_x1": 344.15, "r_y1": 568.86, "r_x2": 344.15, "r_y2": 563.87, "r_x3": 340.31, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 346.8, "t": 563.87, "r": 350.64, "b": 568.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.86, "r_x1": 350.64, "r_y1": 568.86, "r_x2": 350.64, "r_y2": 563.87, "r_x3": 346.8, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 333.6, "t": 563.82, "r": 337.44, "b": 568.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.81, "r_x1": 337.44, "r_y1": 568.81, "r_x2": 337.44, "r_y2": 563.82, "r_x3": 333.6, "r_y3": 563.82, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 340.38, "t": 570.43, "r": 344.22, "b": 575.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 575.42, "r_x1": 344.22, "r_y1": 575.42, "r_x2": 344.22, "r_y2": 570.43, "r_x3": 340.38, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 346.86, "t": 570.43, "r": 350.71, "b": 575.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86, "r_y0": 575.42, "r_x1": 350.71, "r_y1": 575.42, "r_x2": 350.71, "r_y2": 570.43, "r_x3": 346.86, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 333.66, "t": 570.38, "r": 337.5, "b": 575.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 575.37, "r_x1": 337.5, "r_y1": 575.37, "r_x2": 337.5, "r_y2": 570.38, "r_x3": 333.66, "r_y3": 570.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 340.38, "t": 577.03, "r": 344.22, "b": 582.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 582.02, "r_x1": 344.22, "r_y1": 582.02, "r_x2": 344.22, "r_y2": 577.03, "r_x3": 340.38, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 346.87, "t": 577.03, "r": 350.71, "b": 582.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.87, "r_y0": 582.02, "r_x1": 350.71, "r_y1": 582.02, "r_x2": 350.71, "r_y2": 577.03, "r_x3": 346.87, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 333.66, "t": 576.98, "r": 337.5, "b": 581.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 581.97, "r_x1": 337.5, "r_y1": 581.97, "r_x2": 337.5, "r_y2": 576.98, "r_x3": 333.66, "r_y3": 576.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 340.28, "t": 583.4, "r": 344.12, "b": 588.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.28, "r_y0": 588.39, "r_x1": 344.12, "r_y1": 588.39, "r_x2": 344.12, "r_y2": 583.4, "r_x3": 340.28, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 346.77, "t": 583.4, "r": 350.61, "b": 588.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.77, "r_y0": 588.39, "r_x1": 350.61, "r_y1": 588.39, "r_x2": 350.61, "r_y2": 583.4, "r_x3": 346.77, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 333.57, "t": 583.35, "r": 337.41, "b": 588.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.57, "r_y0": 588.35, "r_x1": 337.41, "r_y1": 588.35, "r_x2": 337.41, "r_y2": 583.35, "r_x3": 333.57, "r_y3": 583.35, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 353.03, "t": 556.88, "r": 359.83, "b": 561.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03, "r_y0": 561.87, "r_x1": 359.83, "r_y1": 561.87, "r_x2": 359.83, "r_y2": 556.88, "r_x3": 353.03, "r_y3": 556.88, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 353.19, "t": 563.58, "r": 359.99, "b": 568.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19, "r_y0": 568.57, "r_x1": 359.99, "r_y1": 568.57, "r_x2": 359.99, "r_y2": 563.58, "r_x3": 353.19, "r_y3": 563.58, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 353.2, "t": 570.16, "r": 360.0, "b": 575.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.15, "r_x1": 360.0, "r_y1": 575.15, "r_x2": 360.0, "r_y2": 570.16, "r_x3": 353.2, "r_y3": 570.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 353.15, "t": 576.77, "r": 359.95, "b": 581.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.15, "r_y0": 581.76, "r_x1": 359.95, "r_y1": 581.76, "r_x2": 359.95, "r_y2": 576.77, "r_x3": 353.15, "r_y3": 576.77, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 353.27, "t": 583.41, "r": 360.07, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.27, "r_y0": 588.4, "r_x1": 360.07, "r_y1": 588.4, "r_x2": 360.07, "r_y2": 583.41, "r_x3": 353.27, "r_y3": 583.41, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 347.38, "t": 557.08, "r": 350.34, "b": 562.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.38, "r_y0": 562.07, "r_x1": 350.34, "r_y1": 562.07, "r_x2": 350.34, "r_y2": 557.08, "r_x3": 347.38, "r_y3": 557.08, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 331.14, "t": 564.29, "r": 333.67, "b": 568.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14, "r_y0": 568.55, "r_x1": 333.67, "r_y1": 568.55, "r_x2": 333.67, "r_y2": 564.29, "r_x3": 331.14, "r_y3": 564.29, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 340.81, "t": 554.59, "r": 343.34, "b": 558.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.81, "r_y0": 558.86, "r_x1": 343.34, "r_y1": 558.86, "r_x2": 343.34, "r_y2": 554.59, "r_x3": 340.81, "r_y3": 554.59, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 330.98, "t": 554.83, "r": 333.51, "b": 559.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.98, "r_y0": 559.09, "r_x1": 333.51, "r_y1": 559.09, "r_x2": 333.51, "r_y2": 554.83, "r_x3": 330.98, "r_y3": 554.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 4, "label": "text", "bbox": { "l": 134.76, "t": 620.19, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.951, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 149.71, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.83, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" }, { "label": "page_header", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.863, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "text", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 139.69, "coord_origin": "TOPLEFT" }, "confidence": 0.946, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 163.56, "r_y1": 139.69, "r_x2": 163.56, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "reduces significantly the column drift seen in the HTML based models (see Figure 5)." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 134.76, "t": 161.56, "r": 319.35, "b": 170.36, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 170.36, "r_x1": 149.4, "r_y1": 170.36, "r_x2": 149.4, "r_y2": 161.56, "r_x3": 134.76, "r_y3": 161.56, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 170.36, "r_x1": 319.35, "r_y1": 170.36, "r_x2": 319.35, "r_y2": 161.56, "r_x3": 160.86, "r_y3": 161.56, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.3 Error-detection and -mitigation" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 182.28, "r": 480.6, "b": 298.68, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 191.08, "r_x1": 480.6, "r_y1": 191.08, "r_x2": 480.6, "r_y2": 182.28, "r_x3": 134.76, "r_y3": 182.28, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 203.03, "r_x1": 480.59, "r_y1": 203.03, "r_x2": 480.59, "r_y2": 194.24, "r_x3": 134.76, "r_y3": 194.24, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 214.99, "r_x1": 480.59, "r_y1": 214.99, "r_x2": 480.59, "r_y2": 206.19, "r_x3": 134.76, "r_y3": 206.19, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 226.94, "r_x1": 480.59, "r_y1": 226.94, "r_x2": 480.59, "r_y2": 218.15, "r_x3": 134.76, "r_y3": 218.15, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 238.9, "r_x1": 480.59, "r_y1": 238.9, "r_x2": 480.59, "r_y2": 230.1, "r_x3": 134.76, "r_y3": 230.1, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 250.85, "r_x1": 480.59, "r_y1": 250.85, "r_x2": 480.59, "r_y2": 242.06, "r_x3": 134.76, "r_y3": 242.06, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 262.81, "r_x1": 480.59, "r_y1": 262.81, "r_x2": 480.59, "r_y2": 254.01, "r_x3": 134.76, "r_y3": 254.01, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 274.77, "r_x1": 480.59, "r_y1": 274.77, "r_x2": 480.59, "r_y2": 265.97, "r_x3": 134.76, "r_y3": 265.97, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 286.72, "r_x1": 480.6, "r_y1": 286.72, "r_x2": 480.6, "r_y2": 277.92, "r_x3": 134.76, "r_y3": 277.92, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 298.68, "r_x1": 469.4, "r_y1": 298.68, "r_x2": 469.4, "r_y2": 289.88, "r_x3": 134.76, "r_y3": 289.88, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished sequence. The detection of an invalid sequence token is a clear indication of a prediction mistake, however a valid sequence by itself does not guarantee prediction correctness. Different heuristics can be used to correct token errors in an invalid sequence and thus increase the chances for accurate predictions. Such heuristics can be applied either after the prediction of each token, or at the end on the entire predicted sequence. For example a simple heuristic which can correct the predicted OTSL sequence on-the-fly is to verify if the token with the highest prediction confidence invalidates the predicted sequence, and replace it by the token with the next highest confidence until OTSL rules are satisfied." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76, "t": 321.16, "r": 229.04, "b": 331.73, "coord_origin": "TOPLEFT" }, "confidence": 0.952, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.73, "r_x1": 141.49, "r_y1": 331.73, "r_x2": 141.49, "r_y2": 321.16, "r_x3": 134.76, "r_y3": 321.16, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 331.73, "r_x1": 229.04, "r_y1": 331.73, "r_x2": 229.04, "r_y2": 321.16, "r_x3": 154.94, "r_y3": 321.16, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5 Experiments" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 347.25, "r": 480.6, "b": 451.69, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 356.05, "r_x1": 480.59, "r_y1": 356.05, "r_x2": 480.59, "r_y2": 347.25, "r_x3": 134.76, "r_y3": 347.25, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 368.0, "r_x1": 480.59, "r_y1": 368.0, "r_x2": 480.59, "r_y2": 359.2, "r_x3": 134.76, "r_y3": 359.2, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.96, "r_x1": 480.59, "r_y1": 379.96, "r_x2": 480.59, "r_y2": 371.16, "r_x3": 134.76, "r_y3": 371.16, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.91, "r_x1": 480.59, "r_y1": 391.91, "r_x2": 480.59, "r_y2": 383.11, "r_x3": 134.76, "r_y3": 383.11, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 403.87, "r_x1": 148.6, "r_y1": 403.87, "r_x2": 148.6, "r_y2": 395.07, "r_x3": 134.76, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.63, "r_y0": 403.87, "r_x1": 191.85, "r_y1": 403.87, "r_x2": 191.85, "r_y2": 395.07, "r_x3": 151.63, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 403.87, "r_x1": 480.6, "r_y1": 403.87, "r_x2": 480.6, "r_y2": 395.07, "r_x3": 195.9, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 415.82, "r_x1": 480.59, "r_y1": 415.82, "r_x2": 480.59, "r_y2": 407.02, "r_x3": 134.77, "r_y3": 407.02, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 427.78, "r_x1": 480.59, "r_y1": 427.78, "r_x2": 480.59, "r_y2": 418.98, "r_x3": 134.77, "r_y3": 418.98, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 439.73, "r_x1": 480.59, "r_y1": 439.73, "r_x2": 480.59, "r_y2": 430.94, "r_x3": 134.77, "r_y3": 430.94, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 451.69, "r_x1": 479.3, "r_y1": 451.69, "r_x2": 479.3, "r_y2": 442.89, "r_x3": 134.77, "r_y3": 442.89, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we conducted a series of experiments based on the TableFormer model (Figure 4) with two objectives: Firstly we evaluate the prediction quality and performance of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on the canonical PubTabNet data set. Secondly we pick the best hyper-parameters found in the first step and evaluate how OTSL impacts the performance of TableFormer after training on other publicly available data sets (FinTabNet, PubTables-1M [14]). The ground truth (GT) from all data sets has been converted into OTSL format for this purpose, and will be made publicly available." }, { "label": "caption", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.77, "t": 484.65, "r": 480.59, "b": 503.74, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 492.57, "r_x1": 162.64, "r_y1": 492.57, "r_x2": 162.64, "r_y2": 484.65, "r_x3": 134.77, "r_y3": 484.65, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 492.78, "r_x1": 480.59, "r_y1": 492.78, "r_x2": 480.59, "r_y2": 484.71, "r_x3": 165.2, "r_y3": 484.71, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 503.74, "r_x1": 206.7, "r_y1": 503.74, "r_x2": 206.7, "r_y2": 495.67, "r_x3": 134.77, "r_y3": 495.67, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 4. Architecture sketch of the TableFormer model, which is a representative for the Im2Seq approach." }, { "label": "picture", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 140.71, "t": 508.06, "r": 472.73, "b": 593.68, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.71, "r_y1": 543.1, "r_x2": 149.71, "r_y2": 540.73, "r_x3": 147.3, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 543.1, "r_x1": 155.72, "r_y1": 543.1, "r_x2": 155.72, "r_y2": 540.73, "r_x3": 150.91, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.76, "r_y0": 537.76, "r_x1": 172.3, "r_y1": 537.76, "r_x2": 172.3, "r_y2": 535.39, "r_x3": 162.76, "r_y3": 535.39, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.64, "r_y0": 537.73, "r_x1": 155.92, "r_y1": 537.73, "r_x2": 155.92, "r_y2": 535.37, "r_x3": 147.64, "r_y3": 535.37, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.73, "r_x3": 158.48, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 547.04, "r_x1": 162.7, "r_y1": 547.04, "r_x2": 162.7, "r_y2": 544.67, "r_x3": 158.48, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 551.28, "r_x1": 164.1, "r_y1": 551.28, "r_x2": 164.1, "r_y2": 548.91, "r_x3": 158.48, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 555.52, "r_x1": 162.7, "r_y1": 555.52, "r_x2": 162.7, "r_y2": 553.15, "r_x3": 158.48, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 543.1, "r_x1": 172.89, "r_y1": 543.1, "r_x2": 172.89, "r_y2": 540.73, "r_x3": 168.82, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 547.04, "r_x1": 172.89, "r_y1": 547.04, "r_x2": 172.89, "r_y2": 544.67, "r_x3": 168.82, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 551.28, "r_x1": 172.89, "r_y1": 551.28, "r_x2": 172.89, "r_y2": 548.91, "r_x3": 168.82, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 555.52, "r_x1": 172.89, "r_y1": 555.52, "r_x2": 172.89, "r_y2": 553.15, "r_x3": 168.82, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.04, "r_x1": 149.71, "r_y1": 547.04, "r_x2": 149.71, "r_y2": 544.67, "r_x3": 147.3, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 547.04, "r_x1": 155.72, "r_y1": 547.04, "r_x2": 155.72, "r_y2": 544.67, "r_x3": 150.91, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.28, "r_x1": 149.71, "r_y1": 551.28, "r_x2": 149.71, "r_y2": 548.91, "r_x3": 147.3, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 551.28, "r_x1": 155.72, "r_y1": 551.28, "r_x2": 155.72, "r_y2": 548.91, "r_x3": 150.91, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.52, "r_x1": 149.71, "r_y1": 555.52, "r_x2": 149.71, "r_y2": 553.15, "r_x3": 147.3, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 555.52, "r_x1": 155.72, "r_y1": 555.52, "r_x2": 155.72, "r_y2": 553.15, "r_x3": 150.91, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05, "r_y0": 521.27, "r_x1": 171.25, "r_y1": 521.27, "r_x2": 171.25, "r_y2": 517.01, "r_x3": 152.05, "r_y3": 517.01, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13, "r_y0": 526.58, "r_x1": 175.17, "r_y1": 526.58, "r_x2": 175.17, "r_y2": 522.31, "r_x3": 148.13, "r_y3": 522.31, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53, "r_y0": 528.78, "r_x1": 220.32, "r_y1": 528.78, "r_x2": 220.32, "r_y2": 524.51, "r_x3": 193.53, "r_y3": 524.51, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47, "r_y0": 534.08, "r_x1": 214.38, "r_y1": 534.08, "r_x2": 214.38, "r_y2": 529.82, "r_x3": 199.47, "r_y3": 529.82, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61, "r_y0": 514.17, "r_x1": 284.47, "r_y1": 514.17, "r_x2": 284.47, "r_y2": 509.91, "r_x3": 273.61, "r_y3": 509.91, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 517.96, "r_x1": 287.63, "r_y1": 517.96, "r_x2": 287.63, "r_y2": 513.69, "r_x3": 270.45, "r_y3": 513.69, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.48, "r_y0": 512.41, "r_x1": 348.14, "r_y1": 512.41, "r_x2": 348.14, "r_y2": 508.14, "r_x3": 332.48, "r_y3": 508.14, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.69, "r_y0": 525.38, "r_x1": 407.25, "r_y1": 525.38, "r_x2": 407.25, "r_y2": 521.12, "r_x3": 376.69, "r_y3": 521.12, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.91, "r_y0": 529.93, "r_x1": 410.04, "r_y1": 529.93, "r_x2": 410.04, "r_y2": 525.67, "r_x3": 373.91, "r_y3": 525.67, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.47, "r_x1": 408.65, "r_y1": 534.47, "r_x2": 408.65, "r_y2": 530.21, "r_x3": 375.3, "r_y3": 530.21, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.07, "r_y0": 539.02, "r_x1": 406.88, "r_y1": 539.02, "r_x2": 406.88, "r_y2": 534.76, "r_x3": 377.07, "r_y3": 534.76, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.57, "r_y0": 567.5, "r_x1": 433.77, "r_y1": 567.5, "r_x2": 433.77, "r_y2": 563.24, "r_x3": 383.57, "r_y3": 563.24, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.53, "r_y0": 572.05, "r_x1": 433.81, "r_y1": 572.05, "r_x2": 433.81, "r_y2": 567.79, "r_x3": 383.53, "r_y3": 567.79, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.48, "r_y0": 576.59, "r_x1": 426.86, "r_y1": 576.59, "r_x2": 426.86, "r_y2": 572.33, "r_x3": 390.48, "r_y3": 572.33, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 582.15, "r_x1": 323.17, "r_y1": 582.15, "r_x2": 323.17, "r_y2": 577.89, "r_x3": 293.95, "r_y3": 577.89, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 586.7, "r_x1": 324.59, "r_y1": 586.7, "r_x2": 324.59, "r_y2": 582.44, "r_x3": 293.95, "r_y3": 582.44, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 546.09, "r_x1": 364.15, "r_y1": 546.09, "r_x2": 364.15, "r_y2": 541.82, "r_x3": 333.08, "r_y3": 541.82, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 549.87, "r_x1": 369.72, "r_y1": 549.87, "r_x2": 369.72, "r_y2": 545.61, "r_x3": 333.08, "r_y3": 545.61, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.66, "r_y0": 519.5, "r_x1": 249.59, "r_y1": 519.5, "r_x2": 249.59, "r_y2": 515.24, "r_x3": 232.66, "r_y3": 515.24, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.82, "r_y0": 550.23, "r_x1": 288.26, "r_y1": 550.23, "r_x2": 288.26, "r_y2": 545.97, "r_x3": 269.82, "r_y3": 545.97, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 554.02, "r_x1": 287.63, "r_y1": 554.02, "r_x2": 287.63, "r_y2": 549.76, "r_x3": 270.45, "r_y3": 549.76, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 520.18, "r_x1": 358.11, "r_y1": 520.18, "r_x2": 358.11, "r_y2": 515.91, "r_x3": 332.18, "r_y3": 515.91, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 526.24, "r_x1": 361.58, "r_y1": 526.24, "r_x2": 361.58, "r_y2": 521.97, "r_x3": 332.18, "r_y3": 521.97, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 532.3, "r_x1": 364.76, "r_y1": 532.3, "r_x2": 364.76, "r_y2": 528.03, "r_x3": 332.18, "r_y3": 528.03, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 538.36, "r_x1": 335.97, "r_y1": 538.36, "r_x2": 335.97, "r_y2": 534.09, "r_x3": 332.18, "r_y3": 534.09, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.89, "r_y0": 520.66, "r_x1": 329.42, "r_y1": 520.66, "r_x2": 329.42, "r_y2": 516.4, "r_x3": 326.89, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 526.69, "r_x1": 329.57, "r_y1": 526.69, "r_x2": 329.57, "r_y2": 522.42, "r_x3": 327.04, "r_y3": 522.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 532.78, "r_x1": 329.57, "r_y1": 532.78, "r_x2": 329.57, "r_y2": 528.52, "r_x3": 327.04, "r_y3": 528.52, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14, "r_y0": 531.71, "r_x1": 426.67, "r_y1": 531.71, "r_x2": 426.67, "r_y2": 527.44, "r_x3": 424.14, "r_y3": 527.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.72, "r_x1": 455.53, "r_y1": 521.72, "r_x2": 455.53, "r_y2": 517.45, "r_x3": 453.0, "r_y3": 517.45, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.86, "r_y0": 521.33, "r_x1": 426.39, "r_y1": 521.33, "r_x2": 426.39, "r_y2": 517.06, "r_x3": 423.86, "r_y3": 517.06, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 562.36, "r_x1": 337.28, "r_y1": 562.36, "r_x2": 337.28, "r_y2": 557.37, "r_x3": 333.43, "r_y3": 557.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35, "r_y0": 562.31, "r_x1": 344.2, "r_y1": 562.31, "r_x2": 344.2, "r_y2": 557.32, "r_x3": 340.35, "r_y3": 557.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.31, "r_y0": 568.86, "r_x1": 344.15, "r_y1": 568.86, "r_x2": 344.15, "r_y2": 563.87, "r_x3": 340.31, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.86, "r_x1": 350.64, "r_y1": 568.86, "r_x2": 350.64, "r_y2": 563.87, "r_x3": 346.8, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.81, "r_x1": 337.44, "r_y1": 568.81, "r_x2": 337.44, "r_y2": 563.82, "r_x3": 333.6, "r_y3": 563.82, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 575.42, "r_x1": 344.22, "r_y1": 575.42, "r_x2": 344.22, "r_y2": 570.43, "r_x3": 340.38, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86, "r_y0": 575.42, "r_x1": 350.71, "r_y1": 575.42, "r_x2": 350.71, "r_y2": 570.43, "r_x3": 346.86, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 575.37, "r_x1": 337.5, "r_y1": 575.37, "r_x2": 337.5, "r_y2": 570.38, "r_x3": 333.66, "r_y3": 570.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 582.02, "r_x1": 344.22, "r_y1": 582.02, "r_x2": 344.22, "r_y2": 577.03, "r_x3": 340.38, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.87, "r_y0": 582.02, "r_x1": 350.71, "r_y1": 582.02, "r_x2": 350.71, "r_y2": 577.03, "r_x3": 346.87, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 581.97, "r_x1": 337.5, "r_y1": 581.97, "r_x2": 337.5, "r_y2": 576.98, "r_x3": 333.66, "r_y3": 576.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.28, "r_y0": 588.39, "r_x1": 344.12, "r_y1": 588.39, "r_x2": 344.12, "r_y2": 583.4, "r_x3": 340.28, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.77, "r_y0": 588.39, "r_x1": 350.61, "r_y1": 588.39, "r_x2": 350.61, "r_y2": 583.4, "r_x3": 346.77, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.57, "r_y0": 588.35, "r_x1": 337.41, "r_y1": 588.35, "r_x2": 337.41, "r_y2": 583.35, "r_x3": 333.57, "r_y3": 583.35, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03, "r_y0": 561.87, "r_x1": 359.83, "r_y1": 561.87, "r_x2": 359.83, "r_y2": 556.88, "r_x3": 353.03, "r_y3": 556.88, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19, "r_y0": 568.57, "r_x1": 359.99, "r_y1": 568.57, "r_x2": 359.99, "r_y2": 563.58, "r_x3": 353.19, "r_y3": 563.58, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.15, "r_x1": 360.0, "r_y1": 575.15, "r_x2": 360.0, "r_y2": 570.16, "r_x3": 353.2, "r_y3": 570.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.15, "r_y0": 581.76, "r_x1": 359.95, "r_y1": 581.76, "r_x2": 359.95, "r_y2": 576.77, "r_x3": 353.15, "r_y3": 576.77, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.27, "r_y0": 588.4, "r_x1": 360.07, "r_y1": 588.4, "r_x2": 360.07, "r_y2": 583.41, "r_x3": 353.27, "r_y3": 583.41, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.38, "r_y0": 562.07, "r_x1": 350.34, "r_y1": 562.07, "r_x2": 350.34, "r_y2": 557.08, "r_x3": 347.38, "r_y3": 557.08, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14, "r_y0": 568.55, "r_x1": 333.67, "r_y1": 568.55, "r_x2": 333.67, "r_y2": 564.29, "r_x3": 331.14, "r_y3": 564.29, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.81, "r_y0": 558.86, "r_x1": 343.34, "r_y1": 558.86, "r_x2": 343.34, "r_y2": 554.59, "r_x3": 340.81, "r_y3": 554.59, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.98, "r_y0": 559.09, "r_x1": 333.51, "r_y1": 559.09, "r_x2": 333.51, "r_y2": 554.83, "r_x3": 330.98, "r_y3": 554.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 13, "label": "text", "bbox": { "l": 147.3, "t": 540.73, "r": 149.71, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.71, "r_y1": 543.1, "r_x2": 149.71, "r_y2": 540.73, "r_x3": 147.3, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 150.91, "t": 540.73, "r": 155.72, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 543.1, "r_x1": 155.72, "r_y1": 543.1, "r_x2": 155.72, "r_y2": 540.73, "r_x3": 150.91, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 162.76, "t": 535.39, "r": 172.3, "b": 537.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.76, "r_y0": 537.76, "r_x1": 172.3, "r_y1": 537.76, "r_x2": 172.3, "r_y2": 535.39, "r_x3": 162.76, "r_y3": 535.39, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 147.64, "t": 535.37, "r": 155.92, "b": 537.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.64, "r_y0": 537.73, "r_x1": 155.92, "r_y1": 537.73, "r_x2": 155.92, "r_y2": 535.37, "r_x3": 147.64, "r_y3": 535.37, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 158.48, "t": 540.73, "r": 164.1, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.73, "r_x3": 158.48, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 158.48, "t": 544.67, "r": 162.7, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 547.04, "r_x1": 162.7, "r_y1": 547.04, "r_x2": 162.7, "r_y2": 544.67, "r_x3": 158.48, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 158.48, "t": 548.91, "r": 164.1, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 551.28, "r_x1": 164.1, "r_y1": 551.28, "r_x2": 164.1, "r_y2": 548.91, "r_x3": 158.48, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 158.48, "t": 553.15, "r": 162.7, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 555.52, "r_x1": 162.7, "r_y1": 555.52, "r_x2": 162.7, "r_y2": 553.15, "r_x3": 158.48, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 168.82, "t": 540.73, "r": 172.89, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 543.1, "r_x1": 172.89, "r_y1": 543.1, "r_x2": 172.89, "r_y2": 540.73, "r_x3": 168.82, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 168.82, "t": 544.67, "r": 172.89, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 547.04, "r_x1": 172.89, "r_y1": 547.04, "r_x2": 172.89, "r_y2": 544.67, "r_x3": 168.82, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 168.82, "t": 548.91, "r": 172.89, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 551.28, "r_x1": 172.89, "r_y1": 551.28, "r_x2": 172.89, "r_y2": 548.91, "r_x3": 168.82, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 168.82, "t": 553.15, "r": 172.89, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 555.52, "r_x1": 172.89, "r_y1": 555.52, "r_x2": 172.89, "r_y2": 553.15, "r_x3": 168.82, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 147.3, "t": 544.67, "r": 149.71, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.04, "r_x1": 149.71, "r_y1": 547.04, "r_x2": 149.71, "r_y2": 544.67, "r_x3": 147.3, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 150.91, "t": 544.67, "r": 155.72, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 547.04, "r_x1": 155.72, "r_y1": 547.04, "r_x2": 155.72, "r_y2": 544.67, "r_x3": 150.91, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 147.3, "t": 548.91, "r": 149.71, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.28, "r_x1": 149.71, "r_y1": 551.28, "r_x2": 149.71, "r_y2": 548.91, "r_x3": 147.3, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 150.91, "t": 548.91, "r": 155.72, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 551.28, "r_x1": 155.72, "r_y1": 551.28, "r_x2": 155.72, "r_y2": 548.91, "r_x3": 150.91, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 147.3, "t": 553.15, "r": 149.71, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.52, "r_x1": 149.71, "r_y1": 555.52, "r_x2": 149.71, "r_y2": 553.15, "r_x3": 147.3, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 150.91, "t": 553.15, "r": 155.72, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 555.52, "r_x1": 155.72, "r_y1": 555.52, "r_x2": 155.72, "r_y2": 553.15, "r_x3": 150.91, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 152.05, "t": 517.01, "r": 171.25, "b": 521.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05, "r_y0": 521.27, "r_x1": 171.25, "r_y1": 521.27, "r_x2": 171.25, "r_y2": 517.01, "r_x3": 152.05, "r_y3": 517.01, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 148.13, "t": 522.31, "r": 175.17, "b": 526.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13, "r_y0": 526.58, "r_x1": 175.17, "r_y1": 526.58, "r_x2": 175.17, "r_y2": 522.31, "r_x3": 148.13, "r_y3": 522.31, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 193.53, "t": 524.51, "r": 220.32, "b": 528.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53, "r_y0": 528.78, "r_x1": 220.32, "r_y1": 528.78, "r_x2": 220.32, "r_y2": 524.51, "r_x3": 193.53, "r_y3": 524.51, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 199.47, "t": 529.82, "r": 214.38, "b": 534.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47, "r_y0": 534.08, "r_x1": 214.38, "r_y1": 534.08, "r_x2": 214.38, "r_y2": 529.82, "r_x3": 199.47, "r_y3": 529.82, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 273.61, "t": 509.91, "r": 284.47, "b": 514.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61, "r_y0": 514.17, "r_x1": 284.47, "r_y1": 514.17, "r_x2": 284.47, "r_y2": 509.91, "r_x3": 273.61, "r_y3": 509.91, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 270.45, "t": 513.69, "r": 287.63, "b": 517.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 517.96, "r_x1": 287.63, "r_y1": 517.96, "r_x2": 287.63, "r_y2": 513.69, "r_x3": 270.45, "r_y3": 513.69, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 332.48, "t": 508.14, "r": 348.14, "b": 512.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.48, "r_y0": 512.41, "r_x1": 348.14, "r_y1": 512.41, "r_x2": 348.14, "r_y2": 508.14, "r_x3": 332.48, "r_y3": 508.14, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 376.69, "t": 521.12, "r": 407.25, "b": 525.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.69, "r_y0": 525.38, "r_x1": 407.25, "r_y1": 525.38, "r_x2": 407.25, "r_y2": 521.12, "r_x3": 376.69, "r_y3": 521.12, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 373.91, "t": 525.67, "r": 410.04, "b": 529.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.91, "r_y0": 529.93, "r_x1": 410.04, "r_y1": 529.93, "r_x2": 410.04, "r_y2": 525.67, "r_x3": 373.91, "r_y3": 525.67, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 375.3, "t": 530.21, "r": 408.65, "b": 534.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.47, "r_x1": 408.65, "r_y1": 534.47, "r_x2": 408.65, "r_y2": 530.21, "r_x3": 375.3, "r_y3": 530.21, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 377.07, "t": 534.76, "r": 406.88, "b": 539.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.07, "r_y0": 539.02, "r_x1": 406.88, "r_y1": 539.02, "r_x2": 406.88, "r_y2": 534.76, "r_x3": 377.07, "r_y3": 534.76, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 383.57, "t": 563.24, "r": 433.77, "b": 567.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.57, "r_y0": 567.5, "r_x1": 433.77, "r_y1": 567.5, "r_x2": 433.77, "r_y2": 563.24, "r_x3": 383.57, "r_y3": 563.24, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 383.53, "t": 567.79, "r": 433.81, "b": 572.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.53, "r_y0": 572.05, "r_x1": 433.81, "r_y1": 572.05, "r_x2": 433.81, "r_y2": 567.79, "r_x3": 383.53, "r_y3": 567.79, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 390.48, "t": 572.33, "r": 426.86, "b": 576.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.48, "r_y0": 576.59, "r_x1": 426.86, "r_y1": 576.59, "r_x2": 426.86, "r_y2": 572.33, "r_x3": 390.48, "r_y3": 572.33, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 293.95, "t": 577.89, "r": 323.17, "b": 582.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 582.15, "r_x1": 323.17, "r_y1": 582.15, "r_x2": 323.17, "r_y2": 577.89, "r_x3": 293.95, "r_y3": 577.89, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 293.95, "t": 582.44, "r": 324.59, "b": 586.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 586.7, "r_x1": 324.59, "r_y1": 586.7, "r_x2": 324.59, "r_y2": 582.44, "r_x3": 293.95, "r_y3": 582.44, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 333.08, "t": 541.82, "r": 364.15, "b": 546.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 546.09, "r_x1": 364.15, "r_y1": 546.09, "r_x2": 364.15, "r_y2": 541.82, "r_x3": 333.08, "r_y3": 541.82, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 333.08, "t": 545.61, "r": 369.72, "b": 549.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 549.87, "r_x1": 369.72, "r_y1": 549.87, "r_x2": 369.72, "r_y2": 545.61, "r_x3": 333.08, "r_y3": 545.61, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 232.66, "t": 515.24, "r": 249.59, "b": 519.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.66, "r_y0": 519.5, "r_x1": 249.59, "r_y1": 519.5, "r_x2": 249.59, "r_y2": 515.24, "r_x3": 232.66, "r_y3": 515.24, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 269.82, "t": 545.97, "r": 288.26, "b": 550.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.82, "r_y0": 550.23, "r_x1": 288.26, "r_y1": 550.23, "r_x2": 288.26, "r_y2": 545.97, "r_x3": 269.82, "r_y3": 545.97, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 270.45, "t": 549.76, "r": 287.63, "b": 554.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 554.02, "r_x1": 287.63, "r_y1": 554.02, "r_x2": 287.63, "r_y2": 549.76, "r_x3": 270.45, "r_y3": 549.76, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 332.18, "t": 515.91, "r": 358.11, "b": 520.18, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 520.18, "r_x1": 358.11, "r_y1": 520.18, "r_x2": 358.11, "r_y2": 515.91, "r_x3": 332.18, "r_y3": 515.91, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 332.18, "t": 521.97, "r": 361.58, "b": 526.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 526.24, "r_x1": 361.58, "r_y1": 526.24, "r_x2": 361.58, "r_y2": 521.97, "r_x3": 332.18, "r_y3": 521.97, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 332.18, "t": 528.03, "r": 364.76, "b": 532.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 532.3, "r_x1": 364.76, "r_y1": 532.3, "r_x2": 364.76, "r_y2": 528.03, "r_x3": 332.18, "r_y3": 528.03, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 332.18, "t": 534.09, "r": 335.97, "b": 538.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 538.36, "r_x1": 335.97, "r_y1": 538.36, "r_x2": 335.97, "r_y2": 534.09, "r_x3": 332.18, "r_y3": 534.09, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.89, "t": 516.4, "r": 329.42, "b": 520.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.89, "r_y0": 520.66, "r_x1": 329.42, "r_y1": 520.66, "r_x2": 329.42, "r_y2": 516.4, "r_x3": 326.89, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 327.04, "t": 522.42, "r": 329.57, "b": 526.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 526.69, "r_x1": 329.57, "r_y1": 526.69, "r_x2": 329.57, "r_y2": 522.42, "r_x3": 327.04, "r_y3": 522.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 327.04, "t": 528.52, "r": 329.57, "b": 532.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 532.78, "r_x1": 329.57, "r_y1": 532.78, "r_x2": 329.57, "r_y2": 528.52, "r_x3": 327.04, "r_y3": 528.52, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 424.14, "t": 527.44, "r": 426.67, "b": 531.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14, "r_y0": 531.71, "r_x1": 426.67, "r_y1": 531.71, "r_x2": 426.67, "r_y2": 527.44, "r_x3": 424.14, "r_y3": 527.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 453.0, "t": 517.45, "r": 455.53, "b": 521.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.72, "r_x1": 455.53, "r_y1": 521.72, "r_x2": 455.53, "r_y2": 517.45, "r_x3": 453.0, "r_y3": 517.45, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 423.86, "t": 517.06, "r": 426.39, "b": 521.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.86, "r_y0": 521.33, "r_x1": 426.39, "r_y1": 521.33, "r_x2": 426.39, "r_y2": 517.06, "r_x3": 423.86, "r_y3": 517.06, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 333.43, "t": 557.37, "r": 337.28, "b": 562.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 562.36, "r_x1": 337.28, "r_y1": 562.36, "r_x2": 337.28, "r_y2": 557.37, "r_x3": 333.43, "r_y3": 557.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 340.35, "t": 557.32, "r": 344.2, "b": 562.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35, "r_y0": 562.31, "r_x1": 344.2, "r_y1": 562.31, "r_x2": 344.2, "r_y2": 557.32, "r_x3": 340.35, "r_y3": 557.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 340.31, "t": 563.87, "r": 344.15, "b": 568.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.31, "r_y0": 568.86, "r_x1": 344.15, "r_y1": 568.86, "r_x2": 344.15, "r_y2": 563.87, "r_x3": 340.31, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 346.8, "t": 563.87, "r": 350.64, "b": 568.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.86, "r_x1": 350.64, "r_y1": 568.86, "r_x2": 350.64, "r_y2": 563.87, "r_x3": 346.8, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 333.6, "t": 563.82, "r": 337.44, "b": 568.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.81, "r_x1": 337.44, "r_y1": 568.81, "r_x2": 337.44, "r_y2": 563.82, "r_x3": 333.6, "r_y3": 563.82, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 340.38, "t": 570.43, "r": 344.22, "b": 575.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 575.42, "r_x1": 344.22, "r_y1": 575.42, "r_x2": 344.22, "r_y2": 570.43, "r_x3": 340.38, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 346.86, "t": 570.43, "r": 350.71, "b": 575.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86, "r_y0": 575.42, "r_x1": 350.71, "r_y1": 575.42, "r_x2": 350.71, "r_y2": 570.43, "r_x3": 346.86, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 333.66, "t": 570.38, "r": 337.5, "b": 575.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 575.37, "r_x1": 337.5, "r_y1": 575.37, "r_x2": 337.5, "r_y2": 570.38, "r_x3": 333.66, "r_y3": 570.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 340.38, "t": 577.03, "r": 344.22, "b": 582.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 582.02, "r_x1": 344.22, "r_y1": 582.02, "r_x2": 344.22, "r_y2": 577.03, "r_x3": 340.38, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 346.87, "t": 577.03, "r": 350.71, "b": 582.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.87, "r_y0": 582.02, "r_x1": 350.71, "r_y1": 582.02, "r_x2": 350.71, "r_y2": 577.03, "r_x3": 346.87, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 333.66, "t": 576.98, "r": 337.5, "b": 581.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 581.97, "r_x1": 337.5, "r_y1": 581.97, "r_x2": 337.5, "r_y2": 576.98, "r_x3": 333.66, "r_y3": 576.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 340.28, "t": 583.4, "r": 344.12, "b": 588.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.28, "r_y0": 588.39, "r_x1": 344.12, "r_y1": 588.39, "r_x2": 344.12, "r_y2": 583.4, "r_x3": 340.28, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 346.77, "t": 583.4, "r": 350.61, "b": 588.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.77, "r_y0": 588.39, "r_x1": 350.61, "r_y1": 588.39, "r_x2": 350.61, "r_y2": 583.4, "r_x3": 346.77, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 333.57, "t": 583.35, "r": 337.41, "b": 588.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.57, "r_y0": 588.35, "r_x1": 337.41, "r_y1": 588.35, "r_x2": 337.41, "r_y2": 583.35, "r_x3": 333.57, "r_y3": 583.35, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 353.03, "t": 556.88, "r": 359.83, "b": 561.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03, "r_y0": 561.87, "r_x1": 359.83, "r_y1": 561.87, "r_x2": 359.83, "r_y2": 556.88, "r_x3": 353.03, "r_y3": 556.88, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 353.19, "t": 563.58, "r": 359.99, "b": 568.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19, "r_y0": 568.57, "r_x1": 359.99, "r_y1": 568.57, "r_x2": 359.99, "r_y2": 563.58, "r_x3": 353.19, "r_y3": 563.58, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 353.2, "t": 570.16, "r": 360.0, "b": 575.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.15, "r_x1": 360.0, "r_y1": 575.15, "r_x2": 360.0, "r_y2": 570.16, "r_x3": 353.2, "r_y3": 570.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 353.15, "t": 576.77, "r": 359.95, "b": 581.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.15, "r_y0": 581.76, "r_x1": 359.95, "r_y1": 581.76, "r_x2": 359.95, "r_y2": 576.77, "r_x3": 353.15, "r_y3": 576.77, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 353.27, "t": 583.41, "r": 360.07, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.27, "r_y0": 588.4, "r_x1": 360.07, "r_y1": 588.4, "r_x2": 360.07, "r_y2": 583.41, "r_x3": 353.27, "r_y3": 583.41, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 347.38, "t": 557.08, "r": 350.34, "b": 562.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.38, "r_y0": 562.07, "r_x1": 350.34, "r_y1": 562.07, "r_x2": 350.34, "r_y2": 557.08, "r_x3": 347.38, "r_y3": 557.08, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 331.14, "t": 564.29, "r": 333.67, "b": 568.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14, "r_y0": 568.55, "r_x1": 333.67, "r_y1": 568.55, "r_x2": 333.67, "r_y2": 564.29, "r_x3": 331.14, "r_y3": 564.29, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 340.81, "t": 554.59, "r": 343.34, "b": 558.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.81, "r_y0": 558.86, "r_x1": 343.34, "r_y1": 558.86, "r_x2": 343.34, "r_y2": 554.59, "r_x3": 340.81, "r_y3": 554.59, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 330.98, "t": 554.83, "r": 333.51, "b": 559.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.98, "r_y0": 559.09, "r_x1": 333.51, "r_y1": 559.09, "r_x2": 333.51, "r_y2": 554.83, "r_x3": 330.98, "r_y3": 554.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.76, "t": 620.19, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.951, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 149.71, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for table structure prediction, and Mean Average Precision (mAP) with 0.75 Intersection Over Union (IOU) threshold for the bounding-box predictions of table cells. The predicted OTSL structures were converted back to HTML format in" } ], "body": [ { "label": "text", "id": 5, "page_no": 7, "cluster": { "id": 5, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.59, "b": 139.69, "coord_origin": "TOPLEFT" }, "confidence": 0.946, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "reduces significantly the column drift seen in the HTML based models (see Fig-", "orig": "reduces significantly the column drift seen in the HTML based models (see Fig-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 163.56, "r_y1": 139.69, "r_x2": 163.56, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "ure 5).", "orig": "ure 5).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "reduces significantly the column drift seen in the HTML based models (see Figure 5)." }, { "label": "section_header", "id": 2, "page_no": 7, "cluster": { "id": 2, "label": "section_header", "bbox": { "l": 134.76, "t": 161.56, "r": 319.35, "b": 170.36, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 170.36, "r_x1": 149.4, "r_y1": 170.36, "r_x2": 149.4, "r_y2": 161.56, "r_x3": 134.76, "r_y3": 161.56, "coord_origin": "TOPLEFT" }, "text": "4.3", "orig": "4.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 170.36, "r_x1": 319.35, "r_y1": 170.36, "r_x2": 319.35, "r_y2": 161.56, "r_x3": 160.86, "r_y3": 161.56, "coord_origin": "TOPLEFT" }, "text": "Error-detection and -mitigation", "orig": "Error-detection and -mitigation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4.3 Error-detection and -mitigation" }, { "label": "text", "id": 0, "page_no": 7, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 182.28, "r": 480.6, "b": 298.68, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 191.08, "r_x1": 480.6, "r_y1": 191.08, "r_x2": 480.6, "r_y2": 182.28, "r_x3": 134.76, "r_y3": 182.28, "coord_origin": "TOPLEFT" }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished", "orig": "The design of OTSL allows to validate a table structure easily on an unfinished", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 203.03, "r_x1": 480.59, "r_y1": 203.03, "r_x2": 480.59, "r_y2": 194.24, "r_x3": 134.76, "r_y3": 194.24, "coord_origin": "TOPLEFT" }, "text": "sequence. The detection of an invalid sequence token is a clear indication of a", "orig": "sequence. The detection of an invalid sequence token is a clear indication of a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 214.99, "r_x1": 480.59, "r_y1": 214.99, "r_x2": 480.59, "r_y2": 206.19, "r_x3": 134.76, "r_y3": 206.19, "coord_origin": "TOPLEFT" }, "text": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "orig": "prediction mistake, however a valid sequence by itself does not guarantee pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 226.94, "r_x1": 480.59, "r_y1": 226.94, "r_x2": 480.59, "r_y2": 218.15, "r_x3": 134.76, "r_y3": 218.15, "coord_origin": "TOPLEFT" }, "text": "diction correctness. Different heuristics can be used to correct token errors in", "orig": "diction correctness. Different heuristics can be used to correct token errors in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 238.9, "r_x1": 480.59, "r_y1": 238.9, "r_x2": 480.59, "r_y2": 230.1, "r_x3": 134.76, "r_y3": 230.1, "coord_origin": "TOPLEFT" }, "text": "an invalid sequence and thus increase the chances for accurate predictions. Such", "orig": "an invalid sequence and thus increase the chances for accurate predictions. Such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 250.85, "r_x1": 480.59, "r_y1": 250.85, "r_x2": 480.59, "r_y2": 242.06, "r_x3": 134.76, "r_y3": 242.06, "coord_origin": "TOPLEFT" }, "text": "heuristics can be applied either after the prediction of each token, or at the end", "orig": "heuristics can be applied either after the prediction of each token, or at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 262.81, "r_x1": 480.59, "r_y1": 262.81, "r_x2": 480.59, "r_y2": 254.01, "r_x3": 134.76, "r_y3": 254.01, "coord_origin": "TOPLEFT" }, "text": "on the entire predicted sequence. For example a simple heuristic which can cor-", "orig": "on the entire predicted sequence. For example a simple heuristic which can cor-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 274.77, "r_x1": 480.59, "r_y1": 274.77, "r_x2": 480.59, "r_y2": 265.97, "r_x3": 134.76, "r_y3": 265.97, "coord_origin": "TOPLEFT" }, "text": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "orig": "rect the predicted OTSL sequence on-the-fly is to verify if the token with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 286.72, "r_x1": 480.6, "r_y1": 286.72, "r_x2": 480.6, "r_y2": 277.92, "r_x3": 134.76, "r_y3": 277.92, "coord_origin": "TOPLEFT" }, "text": "highest prediction confidence invalidates the predicted sequence, and replace it", "orig": "highest prediction confidence invalidates the predicted sequence, and replace it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 298.68, "r_x1": 469.4, "r_y1": 298.68, "r_x2": 469.4, "r_y2": 289.88, "r_x3": 134.76, "r_y3": 289.88, "coord_origin": "TOPLEFT" }, "text": "by the token with the next highest confidence until OTSL rules are satisfied.", "orig": "by the token with the next highest confidence until OTSL rules are satisfied.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "The design of OTSL allows to validate a table structure easily on an unfinished sequence. The detection of an invalid sequence token is a clear indication of a prediction mistake, however a valid sequence by itself does not guarantee prediction correctness. Different heuristics can be used to correct token errors in an invalid sequence and thus increase the chances for accurate predictions. Such heuristics can be applied either after the prediction of each token, or at the end on the entire predicted sequence. For example a simple heuristic which can correct the predicted OTSL sequence on-the-fly is to verify if the token with the highest prediction confidence invalidates the predicted sequence, and replace it by the token with the next highest confidence until OTSL rules are satisfied." }, { "label": "section_header", "id": 3, "page_no": 7, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76, "t": 321.16, "r": 229.04, "b": 331.73, "coord_origin": "TOPLEFT" }, "confidence": 0.952, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 331.73, "r_x1": 141.49, "r_y1": 331.73, "r_x2": 141.49, "r_y2": 321.16, "r_x3": 134.76, "r_y3": 321.16, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 331.73, "r_x1": 229.04, "r_y1": 331.73, "r_x2": 229.04, "r_y2": 321.16, "r_x3": 154.94, "r_y3": 321.16, "coord_origin": "TOPLEFT" }, "text": "Experiments", "orig": "Experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5 Experiments" }, { "label": "text", "id": 1, "page_no": 7, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 347.25, "r": 480.6, "b": 451.69, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 356.05, "r_x1": 480.59, "r_y1": 356.05, "r_x2": 480.59, "r_y2": 347.25, "r_x3": 134.76, "r_y3": 347.25, "coord_origin": "TOPLEFT" }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "orig": "To evaluate the impact of OTSL on prediction accuracy and inference times, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 368.0, "r_x1": 480.59, "r_y1": 368.0, "r_x2": 480.59, "r_y2": 359.2, "r_x3": 134.76, "r_y3": 359.2, "coord_origin": "TOPLEFT" }, "text": "conducted a series of experiments based on the TableFormer model (Figure 4)", "orig": "conducted a series of experiments based on the TableFormer model (Figure 4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.96, "r_x1": 480.59, "r_y1": 379.96, "r_x2": 480.59, "r_y2": 371.16, "r_x3": 134.76, "r_y3": 371.16, "coord_origin": "TOPLEFT" }, "text": "with two objectives: Firstly we evaluate the prediction quality and performance", "orig": "with two objectives: Firstly we evaluate the prediction quality and performance", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 391.91, "r_x1": 480.59, "r_y1": 391.91, "r_x2": 480.59, "r_y2": 383.11, "r_x3": 134.76, "r_y3": 383.11, "coord_origin": "TOPLEFT" }, "text": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "orig": "of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 403.87, "r_x1": 148.6, "r_y1": 403.87, "r_x2": 148.6, "r_y2": 395.07, "r_x3": 134.76, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.63, "r_y0": 403.87, "r_x1": 191.85, "r_y1": 403.87, "r_x2": 191.85, "r_y2": 395.07, "r_x3": 151.63, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "canonical", "orig": "canonical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 195.9, "r_y0": 403.87, "r_x1": 480.6, "r_y1": 403.87, "r_x2": 480.6, "r_y2": 395.07, "r_x3": 195.9, "r_y3": 395.07, "coord_origin": "TOPLEFT" }, "text": "PubTabNet data set. Secondly we pick the best hyper-parameters", "orig": "PubTabNet data set. Secondly we pick the best hyper-parameters", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 415.82, "r_x1": 480.59, "r_y1": 415.82, "r_x2": 480.59, "r_y2": 407.02, "r_x3": 134.77, "r_y3": 407.02, "coord_origin": "TOPLEFT" }, "text": "found in the first step and evaluate how OTSL impacts the performance of", "orig": "found in the first step and evaluate how OTSL impacts the performance of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 427.78, "r_x1": 480.59, "r_y1": 427.78, "r_x2": 480.59, "r_y2": 418.98, "r_x3": 134.77, "r_y3": 418.98, "coord_origin": "TOPLEFT" }, "text": "TableFormer after training on other publicly available data sets (FinTabNet,", "orig": "TableFormer after training on other publicly available data sets (FinTabNet,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 439.73, "r_x1": 480.59, "r_y1": 439.73, "r_x2": 480.59, "r_y2": 430.94, "r_x3": 134.77, "r_y3": 430.94, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "orig": "PubTables-1M [14]). The ground truth (GT) from all data sets has been con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 451.69, "r_x1": 479.3, "r_y1": 451.69, "r_x2": 479.3, "r_y2": 442.89, "r_x3": 134.77, "r_y3": 442.89, "coord_origin": "TOPLEFT" }, "text": "verted into OTSL format for this purpose, and will be made publicly available.", "orig": "verted into OTSL format for this purpose, and will be made publicly available.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To evaluate the impact of OTSL on prediction accuracy and inference times, we conducted a series of experiments based on the TableFormer model (Figure 4) with two objectives: Firstly we evaluate the prediction quality and performance of OTSL vs. HTML after performing Hyper Parameter Optimization (HPO) on the canonical PubTabNet data set. Secondly we pick the best hyper-parameters found in the first step and evaluate how OTSL impacts the performance of TableFormer after training on other publicly available data sets (FinTabNet, PubTables-1M [14]). The ground truth (GT) from all data sets has been converted into OTSL format for this purpose, and will be made publicly available." }, { "label": "caption", "id": 7, "page_no": 7, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.77, "t": 484.65, "r": 480.59, "b": 503.74, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 492.57, "r_x1": 162.64, "r_y1": 492.57, "r_x2": 162.64, "r_y2": 484.65, "r_x3": 134.77, "r_y3": 484.65, "coord_origin": "TOPLEFT" }, "text": "Fig. 4.", "orig": "Fig. 4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.2, "r_y0": 492.78, "r_x1": 480.59, "r_y1": 492.78, "r_x2": 480.59, "r_y2": 484.71, "r_x3": 165.2, "r_y3": 484.71, "coord_origin": "TOPLEFT" }, "text": "Architecture sketch of the TableFormer model, which is a representative for the", "orig": "Architecture sketch of the TableFormer model, which is a representative for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.77, "r_y0": 503.74, "r_x1": 206.7, "r_y1": 503.74, "r_x2": 206.7, "r_y2": 495.67, "r_x3": 134.77, "r_y3": 495.67, "coord_origin": "TOPLEFT" }, "text": "Im2Seq approach.", "orig": "Im2Seq approach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 4. Architecture sketch of the TableFormer model, which is a representative for the Im2Seq approach." }, { "label": "picture", "id": 6, "page_no": 7, "cluster": { "id": 6, "label": "picture", "bbox": { "l": 140.71, "t": 508.06, "r": 472.73, "b": 593.68, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.71, "r_y1": 543.1, "r_x2": 149.71, "r_y2": 540.73, "r_x3": 147.3, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 543.1, "r_x1": 155.72, "r_y1": 543.1, "r_x2": 155.72, "r_y2": 540.73, "r_x3": 150.91, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.76, "r_y0": 537.76, "r_x1": 172.3, "r_y1": 537.76, "r_x2": 172.3, "r_y2": 535.39, "r_x3": 162.76, "r_y3": 535.39, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.64, "r_y0": 537.73, "r_x1": 155.92, "r_y1": 537.73, "r_x2": 155.92, "r_y2": 535.37, "r_x3": 147.64, "r_y3": 535.37, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.73, "r_x3": 158.48, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 547.04, "r_x1": 162.7, "r_y1": 547.04, "r_x2": 162.7, "r_y2": 544.67, "r_x3": 158.48, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 551.28, "r_x1": 164.1, "r_y1": 551.28, "r_x2": 164.1, "r_y2": 548.91, "r_x3": 158.48, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 555.52, "r_x1": 162.7, "r_y1": 555.52, "r_x2": 162.7, "r_y2": 553.15, "r_x3": 158.48, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 543.1, "r_x1": 172.89, "r_y1": 543.1, "r_x2": 172.89, "r_y2": 540.73, "r_x3": 168.82, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 547.04, "r_x1": 172.89, "r_y1": 547.04, "r_x2": 172.89, "r_y2": 544.67, "r_x3": 168.82, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 551.28, "r_x1": 172.89, "r_y1": 551.28, "r_x2": 172.89, "r_y2": 548.91, "r_x3": 168.82, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 555.52, "r_x1": 172.89, "r_y1": 555.52, "r_x2": 172.89, "r_y2": 553.15, "r_x3": 168.82, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.04, "r_x1": 149.71, "r_y1": 547.04, "r_x2": 149.71, "r_y2": 544.67, "r_x3": 147.3, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 547.04, "r_x1": 155.72, "r_y1": 547.04, "r_x2": 155.72, "r_y2": 544.67, "r_x3": 150.91, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.28, "r_x1": 149.71, "r_y1": 551.28, "r_x2": 149.71, "r_y2": 548.91, "r_x3": 147.3, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 551.28, "r_x1": 155.72, "r_y1": 551.28, "r_x2": 155.72, "r_y2": 548.91, "r_x3": 150.91, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.52, "r_x1": 149.71, "r_y1": 555.52, "r_x2": 149.71, "r_y2": 553.15, "r_x3": 147.3, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 555.52, "r_x1": 155.72, "r_y1": 555.52, "r_x2": 155.72, "r_y2": 553.15, "r_x3": 150.91, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05, "r_y0": 521.27, "r_x1": 171.25, "r_y1": 521.27, "r_x2": 171.25, "r_y2": 517.01, "r_x3": 152.05, "r_y3": 517.01, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13, "r_y0": 526.58, "r_x1": 175.17, "r_y1": 526.58, "r_x2": 175.17, "r_y2": 522.31, "r_x3": 148.13, "r_y3": 522.31, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53, "r_y0": 528.78, "r_x1": 220.32, "r_y1": 528.78, "r_x2": 220.32, "r_y2": 524.51, "r_x3": 193.53, "r_y3": 524.51, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47, "r_y0": 534.08, "r_x1": 214.38, "r_y1": 534.08, "r_x2": 214.38, "r_y2": 529.82, "r_x3": 199.47, "r_y3": 529.82, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61, "r_y0": 514.17, "r_x1": 284.47, "r_y1": 514.17, "r_x2": 284.47, "r_y2": 509.91, "r_x3": 273.61, "r_y3": 509.91, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 517.96, "r_x1": 287.63, "r_y1": 517.96, "r_x2": 287.63, "r_y2": 513.69, "r_x3": 270.45, "r_y3": 513.69, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.48, "r_y0": 512.41, "r_x1": 348.14, "r_y1": 512.41, "r_x2": 348.14, "r_y2": 508.14, "r_x3": 332.48, "r_y3": 508.14, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.69, "r_y0": 525.38, "r_x1": 407.25, "r_y1": 525.38, "r_x2": 407.25, "r_y2": 521.12, "r_x3": 376.69, "r_y3": 521.12, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.91, "r_y0": 529.93, "r_x1": 410.04, "r_y1": 529.93, "r_x2": 410.04, "r_y2": 525.67, "r_x3": 373.91, "r_y3": 525.67, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.47, "r_x1": 408.65, "r_y1": 534.47, "r_x2": 408.65, "r_y2": 530.21, "r_x3": 375.3, "r_y3": 530.21, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.07, "r_y0": 539.02, "r_x1": 406.88, "r_y1": 539.02, "r_x2": 406.88, "r_y2": 534.76, "r_x3": 377.07, "r_y3": 534.76, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.57, "r_y0": 567.5, "r_x1": 433.77, "r_y1": 567.5, "r_x2": 433.77, "r_y2": 563.24, "r_x3": 383.57, "r_y3": 563.24, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.53, "r_y0": 572.05, "r_x1": 433.81, "r_y1": 572.05, "r_x2": 433.81, "r_y2": 567.79, "r_x3": 383.53, "r_y3": 567.79, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.48, "r_y0": 576.59, "r_x1": 426.86, "r_y1": 576.59, "r_x2": 426.86, "r_y2": 572.33, "r_x3": 390.48, "r_y3": 572.33, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 582.15, "r_x1": 323.17, "r_y1": 582.15, "r_x2": 323.17, "r_y2": 577.89, "r_x3": 293.95, "r_y3": 577.89, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 586.7, "r_x1": 324.59, "r_y1": 586.7, "r_x2": 324.59, "r_y2": 582.44, "r_x3": 293.95, "r_y3": 582.44, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 546.09, "r_x1": 364.15, "r_y1": 546.09, "r_x2": 364.15, "r_y2": 541.82, "r_x3": 333.08, "r_y3": 541.82, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 549.87, "r_x1": 369.72, "r_y1": 549.87, "r_x2": 369.72, "r_y2": 545.61, "r_x3": 333.08, "r_y3": 545.61, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.66, "r_y0": 519.5, "r_x1": 249.59, "r_y1": 519.5, "r_x2": 249.59, "r_y2": 515.24, "r_x3": 232.66, "r_y3": 515.24, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.82, "r_y0": 550.23, "r_x1": 288.26, "r_y1": 550.23, "r_x2": 288.26, "r_y2": 545.97, "r_x3": 269.82, "r_y3": 545.97, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 554.02, "r_x1": 287.63, "r_y1": 554.02, "r_x2": 287.63, "r_y2": 549.76, "r_x3": 270.45, "r_y3": 549.76, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 520.18, "r_x1": 358.11, "r_y1": 520.18, "r_x2": 358.11, "r_y2": 515.91, "r_x3": 332.18, "r_y3": 515.91, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 526.24, "r_x1": 361.58, "r_y1": 526.24, "r_x2": 361.58, "r_y2": 521.97, "r_x3": 332.18, "r_y3": 521.97, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 532.3, "r_x1": 364.76, "r_y1": 532.3, "r_x2": 364.76, "r_y2": 528.03, "r_x3": 332.18, "r_y3": 528.03, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 538.36, "r_x1": 335.97, "r_y1": 538.36, "r_x2": 335.97, "r_y2": 534.09, "r_x3": 332.18, "r_y3": 534.09, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.89, "r_y0": 520.66, "r_x1": 329.42, "r_y1": 520.66, "r_x2": 329.42, "r_y2": 516.4, "r_x3": 326.89, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 526.69, "r_x1": 329.57, "r_y1": 526.69, "r_x2": 329.57, "r_y2": 522.42, "r_x3": 327.04, "r_y3": 522.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 532.78, "r_x1": 329.57, "r_y1": 532.78, "r_x2": 329.57, "r_y2": 528.52, "r_x3": 327.04, "r_y3": 528.52, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14, "r_y0": 531.71, "r_x1": 426.67, "r_y1": 531.71, "r_x2": 426.67, "r_y2": 527.44, "r_x3": 424.14, "r_y3": 527.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.72, "r_x1": 455.53, "r_y1": 521.72, "r_x2": 455.53, "r_y2": 517.45, "r_x3": 453.0, "r_y3": 517.45, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.86, "r_y0": 521.33, "r_x1": 426.39, "r_y1": 521.33, "r_x2": 426.39, "r_y2": 517.06, "r_x3": 423.86, "r_y3": 517.06, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 562.36, "r_x1": 337.28, "r_y1": 562.36, "r_x2": 337.28, "r_y2": 557.37, "r_x3": 333.43, "r_y3": 557.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35, "r_y0": 562.31, "r_x1": 344.2, "r_y1": 562.31, "r_x2": 344.2, "r_y2": 557.32, "r_x3": 340.35, "r_y3": 557.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.31, "r_y0": 568.86, "r_x1": 344.15, "r_y1": 568.86, "r_x2": 344.15, "r_y2": 563.87, "r_x3": 340.31, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.86, "r_x1": 350.64, "r_y1": 568.86, "r_x2": 350.64, "r_y2": 563.87, "r_x3": 346.8, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.81, "r_x1": 337.44, "r_y1": 568.81, "r_x2": 337.44, "r_y2": 563.82, "r_x3": 333.6, "r_y3": 563.82, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 575.42, "r_x1": 344.22, "r_y1": 575.42, "r_x2": 344.22, "r_y2": 570.43, "r_x3": 340.38, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86, "r_y0": 575.42, "r_x1": 350.71, "r_y1": 575.42, "r_x2": 350.71, "r_y2": 570.43, "r_x3": 346.86, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 575.37, "r_x1": 337.5, "r_y1": 575.37, "r_x2": 337.5, "r_y2": 570.38, "r_x3": 333.66, "r_y3": 570.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 582.02, "r_x1": 344.22, "r_y1": 582.02, "r_x2": 344.22, "r_y2": 577.03, "r_x3": 340.38, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.87, "r_y0": 582.02, "r_x1": 350.71, "r_y1": 582.02, "r_x2": 350.71, "r_y2": 577.03, "r_x3": 346.87, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 581.97, "r_x1": 337.5, "r_y1": 581.97, "r_x2": 337.5, "r_y2": 576.98, "r_x3": 333.66, "r_y3": 576.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.28, "r_y0": 588.39, "r_x1": 344.12, "r_y1": 588.39, "r_x2": 344.12, "r_y2": 583.4, "r_x3": 340.28, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.77, "r_y0": 588.39, "r_x1": 350.61, "r_y1": 588.39, "r_x2": 350.61, "r_y2": 583.4, "r_x3": 346.77, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.57, "r_y0": 588.35, "r_x1": 337.41, "r_y1": 588.35, "r_x2": 337.41, "r_y2": 583.35, "r_x3": 333.57, "r_y3": 583.35, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03, "r_y0": 561.87, "r_x1": 359.83, "r_y1": 561.87, "r_x2": 359.83, "r_y2": 556.88, "r_x3": 353.03, "r_y3": 556.88, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19, "r_y0": 568.57, "r_x1": 359.99, "r_y1": 568.57, "r_x2": 359.99, "r_y2": 563.58, "r_x3": 353.19, "r_y3": 563.58, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.15, "r_x1": 360.0, "r_y1": 575.15, "r_x2": 360.0, "r_y2": 570.16, "r_x3": 353.2, "r_y3": 570.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.15, "r_y0": 581.76, "r_x1": 359.95, "r_y1": 581.76, "r_x2": 359.95, "r_y2": 576.77, "r_x3": 353.15, "r_y3": 576.77, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.27, "r_y0": 588.4, "r_x1": 360.07, "r_y1": 588.4, "r_x2": 360.07, "r_y2": 583.41, "r_x3": 353.27, "r_y3": 583.41, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.38, "r_y0": 562.07, "r_x1": 350.34, "r_y1": 562.07, "r_x2": 350.34, "r_y2": 557.08, "r_x3": 347.38, "r_y3": 557.08, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14, "r_y0": 568.55, "r_x1": 333.67, "r_y1": 568.55, "r_x2": 333.67, "r_y2": 564.29, "r_x3": 331.14, "r_y3": 564.29, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.81, "r_y0": 558.86, "r_x1": 343.34, "r_y1": 558.86, "r_x2": 343.34, "r_y2": 554.59, "r_x3": 340.81, "r_y3": 554.59, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.98, "r_y0": 559.09, "r_x1": 333.51, "r_y1": 559.09, "r_x2": 333.51, "r_y2": 554.83, "r_x3": 330.98, "r_y3": 554.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 13, "label": "text", "bbox": { "l": 147.3, "t": 540.73, "r": 149.71, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 543.1, "r_x1": 149.71, "r_y1": 543.1, "r_x2": 149.71, "r_y2": 540.73, "r_x3": 147.3, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 150.91, "t": 540.73, "r": 155.72, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 543.1, "r_x1": 155.72, "r_y1": 543.1, "r_x2": 155.72, "r_y2": 540.73, "r_x3": 150.91, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 162.76, "t": 535.39, "r": 172.3, "b": 537.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 162.76, "r_y0": 537.76, "r_x1": 172.3, "r_y1": 537.76, "r_x2": 172.3, "r_y2": 535.39, "r_x3": 162.76, "r_y3": 535.39, "coord_origin": "TOPLEFT" }, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 147.64, "t": 535.37, "r": 155.92, "b": 537.73, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.64, "r_y0": 537.73, "r_x1": 155.92, "r_y1": 537.73, "r_x2": 155.92, "r_y2": 535.37, "r_x3": 147.64, "r_y3": 535.37, "coord_origin": "TOPLEFT" }, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 158.48, "t": 540.73, "r": 164.1, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 543.1, "r_x1": 164.1, "r_y1": 543.1, "r_x2": 164.1, "r_y2": 540.73, "r_x3": 158.48, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 158.48, "t": 544.67, "r": 162.7, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 547.04, "r_x1": 162.7, "r_y1": 547.04, "r_x2": 162.7, "r_y2": 544.67, "r_x3": 158.48, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 158.48, "t": 548.91, "r": 164.1, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 551.28, "r_x1": 164.1, "r_y1": 551.28, "r_x2": 164.1, "r_y2": 548.91, "r_x3": 158.48, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 158.48, "t": 553.15, "r": 162.7, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 158.48, "r_y0": 555.52, "r_x1": 162.7, "r_y1": 555.52, "r_x2": 162.7, "r_y2": 553.15, "r_x3": 158.48, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 168.82, "t": 540.73, "r": 172.89, "b": 543.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 543.1, "r_x1": 172.89, "r_y1": 543.1, "r_x2": 172.89, "r_y2": 540.73, "r_x3": 168.82, "r_y3": 540.73, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 168.82, "t": 544.67, "r": 172.89, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 547.04, "r_x1": 172.89, "r_y1": 547.04, "r_x2": 172.89, "r_y2": 544.67, "r_x3": 168.82, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 168.82, "t": 548.91, "r": 172.89, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 551.28, "r_x1": 172.89, "r_y1": 551.28, "r_x2": 172.89, "r_y2": 548.91, "r_x3": 168.82, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 168.82, "t": 553.15, "r": 172.89, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 168.82, "r_y0": 555.52, "r_x1": 172.89, "r_y1": 555.52, "r_x2": 172.89, "r_y2": 553.15, "r_x3": 168.82, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 147.3, "t": 544.67, "r": 149.71, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 547.04, "r_x1": 149.71, "r_y1": 547.04, "r_x2": 149.71, "r_y2": 544.67, "r_x3": 147.3, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 150.91, "t": 544.67, "r": 155.72, "b": 547.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 547.04, "r_x1": 155.72, "r_y1": 547.04, "r_x2": 155.72, "r_y2": 544.67, "r_x3": 150.91, "r_y3": 544.67, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 147.3, "t": 548.91, "r": 149.71, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 551.28, "r_x1": 149.71, "r_y1": 551.28, "r_x2": 149.71, "r_y2": 548.91, "r_x3": 147.3, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 150.91, "t": 548.91, "r": 155.72, "b": 551.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 551.28, "r_x1": 155.72, "r_y1": 551.28, "r_x2": 155.72, "r_y2": 548.91, "r_x3": 150.91, "r_y3": 548.91, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 147.3, "t": 553.15, "r": 149.71, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 147.3, "r_y0": 555.52, "r_x1": 149.71, "r_y1": 555.52, "r_x2": 149.71, "r_y2": 553.15, "r_x3": 147.3, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 150.91, "t": 553.15, "r": 155.72, "b": 555.52, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 555.52, "r_x1": 155.72, "r_y1": 555.52, "r_x2": 155.72, "r_y2": 553.15, "r_x3": 150.91, "r_y3": 553.15, "coord_origin": "TOPLEFT" }, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 152.05, "t": 517.01, "r": 171.25, "b": 521.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 152.05, "r_y0": 521.27, "r_x1": 171.25, "r_y1": 521.27, "r_x2": 171.25, "r_y2": 517.01, "r_x3": 152.05, "r_y3": 517.01, "coord_origin": "TOPLEFT" }, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 148.13, "t": 522.31, "r": 175.17, "b": 526.58, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.13, "r_y0": 526.58, "r_x1": 175.17, "r_y1": 526.58, "r_x2": 175.17, "r_y2": 522.31, "r_x3": 148.13, "r_y3": 522.31, "coord_origin": "TOPLEFT" }, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 193.53, "t": 524.51, "r": 220.32, "b": 528.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 193.53, "r_y0": 528.78, "r_x1": 220.32, "r_y1": 528.78, "r_x2": 220.32, "r_y2": 524.51, "r_x3": 193.53, "r_y3": 524.51, "coord_origin": "TOPLEFT" }, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 199.47, "t": 529.82, "r": 214.38, "b": 534.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.47, "r_y0": 534.08, "r_x1": 214.38, "r_y1": 534.08, "r_x2": 214.38, "r_y2": 529.82, "r_x3": 199.47, "r_y3": 529.82, "coord_origin": "TOPLEFT" }, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 273.61, "t": 509.91, "r": 284.47, "b": 514.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 273.61, "r_y0": 514.17, "r_x1": 284.47, "r_y1": 514.17, "r_x2": 284.47, "r_y2": 509.91, "r_x3": 273.61, "r_y3": 509.91, "coord_origin": "TOPLEFT" }, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 270.45, "t": 513.69, "r": 287.63, "b": 517.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 517.96, "r_x1": 287.63, "r_y1": 517.96, "r_x2": 287.63, "r_y2": 513.69, "r_x3": 270.45, "r_y3": 513.69, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 332.48, "t": 508.14, "r": 348.14, "b": 512.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.48, "r_y0": 512.41, "r_x1": 348.14, "r_y1": 512.41, "r_x2": 348.14, "r_y2": 508.14, "r_x3": 332.48, "r_y3": 508.14, "coord_origin": "TOPLEFT" }, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 376.69, "t": 521.12, "r": 407.25, "b": 525.38, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 376.69, "r_y0": 525.38, "r_x1": 407.25, "r_y1": 525.38, "r_x2": 407.25, "r_y2": 521.12, "r_x3": 376.69, "r_y3": 521.12, "coord_origin": "TOPLEFT" }, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 373.91, "t": 525.67, "r": 410.04, "b": 529.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 373.91, "r_y0": 529.93, "r_x1": 410.04, "r_y1": 529.93, "r_x2": 410.04, "r_y2": 525.67, "r_x3": 373.91, "r_y3": 525.67, "coord_origin": "TOPLEFT" }, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 375.3, "t": 530.21, "r": 408.65, "b": 534.47, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 375.3, "r_y0": 534.47, "r_x1": 408.65, "r_y1": 534.47, "r_x2": 408.65, "r_y2": 530.21, "r_x3": 375.3, "r_y3": 530.21, "coord_origin": "TOPLEFT" }, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 377.07, "t": 534.76, "r": 406.88, "b": 539.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.07, "r_y0": 539.02, "r_x1": 406.88, "r_y1": 539.02, "r_x2": 406.88, "r_y2": 534.76, "r_x3": 377.07, "r_y3": 534.76, "coord_origin": "TOPLEFT" }, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 383.57, "t": 563.24, "r": 433.77, "b": 567.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.57, "r_y0": 567.5, "r_x1": 433.77, "r_y1": 567.5, "r_x2": 433.77, "r_y2": 563.24, "r_x3": 383.57, "r_y3": 563.24, "coord_origin": "TOPLEFT" }, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 383.53, "t": 567.79, "r": 433.81, "b": 572.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.53, "r_y0": 572.05, "r_x1": 433.81, "r_y1": 572.05, "r_x2": 433.81, "r_y2": 567.79, "r_x3": 383.53, "r_y3": 567.79, "coord_origin": "TOPLEFT" }, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 390.48, "t": 572.33, "r": 426.86, "b": 576.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.48, "r_y0": 576.59, "r_x1": 426.86, "r_y1": 576.59, "r_x2": 426.86, "r_y2": 572.33, "r_x3": 390.48, "r_y3": 572.33, "coord_origin": "TOPLEFT" }, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 293.95, "t": 577.89, "r": 323.17, "b": 582.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 582.15, "r_x1": 323.17, "r_y1": 582.15, "r_x2": 323.17, "r_y2": 577.89, "r_x3": 293.95, "r_y3": 577.89, "coord_origin": "TOPLEFT" }, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 293.95, "t": 582.44, "r": 324.59, "b": 586.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.95, "r_y0": 586.7, "r_x1": 324.59, "r_y1": 586.7, "r_x2": 324.59, "r_y2": 582.44, "r_x3": 293.95, "r_y3": 582.44, "coord_origin": "TOPLEFT" }, "text": "in OTSL format", "orig": "in OTSL format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 333.08, "t": 541.82, "r": 364.15, "b": 546.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 546.09, "r_x1": 364.15, "r_y1": 546.09, "r_x2": 364.15, "r_y2": 541.82, "r_x3": 333.08, "r_y3": 541.82, "coord_origin": "TOPLEFT" }, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 333.08, "t": 545.61, "r": 369.72, "b": 549.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.08, "r_y0": 549.87, "r_x1": 369.72, "r_y1": 549.87, "r_x2": 369.72, "r_y2": 545.61, "r_x3": 333.08, "r_y3": 545.61, "coord_origin": "TOPLEFT" }, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 232.66, "t": 515.24, "r": 249.59, "b": 519.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 232.66, "r_y0": 519.5, "r_x1": 249.59, "r_y1": 519.5, "r_x2": 249.59, "r_y2": 515.24, "r_x3": 232.66, "r_y3": 515.24, "coord_origin": "TOPLEFT" }, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 269.82, "t": 545.97, "r": 288.26, "b": 550.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 269.82, "r_y0": 550.23, "r_x1": 288.26, "r_y1": 550.23, "r_x2": 288.26, "r_y2": 545.97, "r_x3": 269.82, "r_y3": 545.97, "coord_origin": "TOPLEFT" }, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 270.45, "t": 549.76, "r": 287.63, "b": 554.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 270.45, "r_y0": 554.02, "r_x1": 287.63, "r_y1": 554.02, "r_x2": 287.63, "r_y2": 549.76, "r_x3": 270.45, "r_y3": 549.76, "coord_origin": "TOPLEFT" }, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 332.18, "t": 515.91, "r": 358.11, "b": 520.18, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 520.18, "r_x1": 358.11, "r_y1": 520.18, "r_x2": 358.11, "r_y2": 515.91, "r_x3": 332.18, "r_y3": 515.91, "coord_origin": "TOPLEFT" }, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 332.18, "t": 521.97, "r": 361.58, "b": 526.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 526.24, "r_x1": 361.58, "r_y1": 526.24, "r_x2": 361.58, "r_y2": 521.97, "r_x3": 332.18, "r_y3": 521.97, "coord_origin": "TOPLEFT" }, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 332.18, "t": 528.03, "r": 364.76, "b": 532.3, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 532.3, "r_x1": 364.76, "r_y1": 532.3, "r_x2": 364.76, "r_y2": 528.03, "r_x3": 332.18, "r_y3": 528.03, "coord_origin": "TOPLEFT" }, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 332.18, "t": 534.09, "r": 335.97, "b": 538.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 332.18, "r_y0": 538.36, "r_x1": 335.97, "r_y1": 538.36, "r_x2": 335.97, "r_y2": 534.09, "r_x3": 332.18, "r_y3": 534.09, "coord_origin": "TOPLEFT" }, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.89, "t": 516.4, "r": 329.42, "b": 520.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.89, "r_y0": 520.66, "r_x1": 329.42, "r_y1": 520.66, "r_x2": 329.42, "r_y2": 516.4, "r_x3": 326.89, "r_y3": 516.4, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 327.04, "t": 522.42, "r": 329.57, "b": 526.69, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 526.69, "r_x1": 329.57, "r_y1": 526.69, "r_x2": 329.57, "r_y2": 522.42, "r_x3": 327.04, "r_y3": 522.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 327.04, "t": 528.52, "r": 329.57, "b": 532.78, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 327.04, "r_y0": 532.78, "r_x1": 329.57, "r_y1": 532.78, "r_x2": 329.57, "r_y2": 528.52, "r_x3": 327.04, "r_y3": 528.52, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 424.14, "t": 527.44, "r": 426.67, "b": 531.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 424.14, "r_y0": 531.71, "r_x1": 426.67, "r_y1": 531.71, "r_x2": 426.67, "r_y2": 527.44, "r_x3": 424.14, "r_y3": 527.44, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 453.0, "t": 517.45, "r": 455.53, "b": 521.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 453.0, "r_y0": 521.72, "r_x1": 455.53, "r_y1": 521.72, "r_x2": 455.53, "r_y2": 517.45, "r_x3": 453.0, "r_y3": 517.45, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 423.86, "t": 517.06, "r": 426.39, "b": 521.33, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.86, "r_y0": 521.33, "r_x1": 426.39, "r_y1": 521.33, "r_x2": 426.39, "r_y2": 517.06, "r_x3": 423.86, "r_y3": 517.06, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 333.43, "t": 557.37, "r": 337.28, "b": 562.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.43, "r_y0": 562.36, "r_x1": 337.28, "r_y1": 562.36, "r_x2": 337.28, "r_y2": 557.37, "r_x3": 333.43, "r_y3": 557.37, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 340.35, "t": 557.32, "r": 344.2, "b": 562.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.35, "r_y0": 562.31, "r_x1": 344.2, "r_y1": 562.31, "r_x2": 344.2, "r_y2": 557.32, "r_x3": 340.35, "r_y3": 557.32, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 340.31, "t": 563.87, "r": 344.15, "b": 568.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.31, "r_y0": 568.86, "r_x1": 344.15, "r_y1": 568.86, "r_x2": 344.15, "r_y2": 563.87, "r_x3": 340.31, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 346.8, "t": 563.87, "r": 350.64, "b": 568.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.8, "r_y0": 568.86, "r_x1": 350.64, "r_y1": 568.86, "r_x2": 350.64, "r_y2": 563.87, "r_x3": 346.8, "r_y3": 563.87, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 333.6, "t": 563.82, "r": 337.44, "b": 568.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.6, "r_y0": 568.81, "r_x1": 337.44, "r_y1": 568.81, "r_x2": 337.44, "r_y2": 563.82, "r_x3": 333.6, "r_y3": 563.82, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 340.38, "t": 570.43, "r": 344.22, "b": 575.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 575.42, "r_x1": 344.22, "r_y1": 575.42, "r_x2": 344.22, "r_y2": 570.43, "r_x3": 340.38, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 346.86, "t": 570.43, "r": 350.71, "b": 575.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.86, "r_y0": 575.42, "r_x1": 350.71, "r_y1": 575.42, "r_x2": 350.71, "r_y2": 570.43, "r_x3": 346.86, "r_y3": 570.43, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 333.66, "t": 570.38, "r": 337.5, "b": 575.37, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 575.37, "r_x1": 337.5, "r_y1": 575.37, "r_x2": 337.5, "r_y2": 570.38, "r_x3": 333.66, "r_y3": 570.38, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 340.38, "t": 577.03, "r": 344.22, "b": 582.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.38, "r_y0": 582.02, "r_x1": 344.22, "r_y1": 582.02, "r_x2": 344.22, "r_y2": 577.03, "r_x3": 340.38, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 346.87, "t": 577.03, "r": 350.71, "b": 582.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.87, "r_y0": 582.02, "r_x1": 350.71, "r_y1": 582.02, "r_x2": 350.71, "r_y2": 577.03, "r_x3": 346.87, "r_y3": 577.03, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 333.66, "t": 576.98, "r": 337.5, "b": 581.97, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.66, "r_y0": 581.97, "r_x1": 337.5, "r_y1": 581.97, "r_x2": 337.5, "r_y2": 576.98, "r_x3": 333.66, "r_y3": 576.98, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 340.28, "t": 583.4, "r": 344.12, "b": 588.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.28, "r_y0": 588.39, "r_x1": 344.12, "r_y1": 588.39, "r_x2": 344.12, "r_y2": 583.4, "r_x3": 340.28, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 346.77, "t": 583.4, "r": 350.61, "b": 588.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 346.77, "r_y0": 588.39, "r_x1": 350.61, "r_y1": 588.39, "r_x2": 350.61, "r_y2": 583.4, "r_x3": 346.77, "r_y3": 583.4, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 333.57, "t": 583.35, "r": 337.41, "b": 588.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 333.57, "r_y0": 588.35, "r_x1": 337.41, "r_y1": 588.35, "r_x2": 337.41, "r_y2": 583.35, "r_x3": 333.57, "r_y3": 583.35, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 353.03, "t": 556.88, "r": 359.83, "b": 561.87, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.03, "r_y0": 561.87, "r_x1": 359.83, "r_y1": 561.87, "r_x2": 359.83, "r_y2": 556.88, "r_x3": 353.03, "r_y3": 556.88, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 353.19, "t": 563.58, "r": 359.99, "b": 568.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.19, "r_y0": 568.57, "r_x1": 359.99, "r_y1": 568.57, "r_x2": 359.99, "r_y2": 563.58, "r_x3": 353.19, "r_y3": 563.58, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 353.2, "t": 570.16, "r": 360.0, "b": 575.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.2, "r_y0": 575.15, "r_x1": 360.0, "r_y1": 575.15, "r_x2": 360.0, "r_y2": 570.16, "r_x3": 353.2, "r_y3": 570.16, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 353.15, "t": 576.77, "r": 359.95, "b": 581.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.15, "r_y0": 581.76, "r_x1": 359.95, "r_y1": 581.76, "r_x2": 359.95, "r_y2": 576.77, "r_x3": 353.15, "r_y3": 576.77, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 353.27, "t": 583.41, "r": 360.07, "b": 588.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 353.27, "r_y0": 588.4, "r_x1": 360.07, "r_y1": 588.4, "r_x2": 360.07, "r_y2": 583.41, "r_x3": 353.27, "r_y3": 583.41, "coord_origin": "TOPLEFT" }, "text": "NL", "orig": "NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 347.38, "t": 557.08, "r": 350.34, "b": 562.07, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 347.38, "r_y0": 562.07, "r_x1": 350.34, "r_y1": 562.07, "r_x2": 350.34, "r_y2": 557.08, "r_x3": 347.38, "r_y3": 557.08, "coord_origin": "TOPLEFT" }, "text": "L", "orig": "L", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 331.14, "t": 564.29, "r": 333.67, "b": 568.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 331.14, "r_y0": 568.55, "r_x1": 333.67, "r_y1": 568.55, "r_x2": 333.67, "r_y2": 564.29, "r_x3": 331.14, "r_y3": 564.29, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 340.81, "t": 554.59, "r": 343.34, "b": 558.86, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 340.81, "r_y0": 558.86, "r_x1": 343.34, "r_y1": 558.86, "r_x2": 343.34, "r_y2": 554.59, "r_x3": 340.81, "r_y3": 554.59, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 330.98, "t": 554.83, "r": 333.51, "b": 559.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 330.98, "r_y0": 559.09, "r_x1": 333.51, "r_y1": 559.09, "r_x2": 333.51, "r_y2": 554.83, "r_x3": 330.98, "r_y3": 554.83, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 4, "page_no": 7, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.76, "t": 620.19, "r": 480.59, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.951, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 149.71, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "orig": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.59, "r_y1": 640.94, "r_x2": 480.59, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "orig": "table structure prediction, and Mean Average Precision (mAP) with 0.75 Inter-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "section Over Union (IOU) threshold for the bounding-box predictions of table", "orig": "section Over Union (IOU) threshold for the bounding-box predictions of table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 480.59, "r_y1": 664.85, "r_x2": 480.59, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "cells. The predicted OTSL structures were converted back to HTML format in", "orig": "cells. The predicted OTSL structures were converted back to HTML format in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We rely on standard metrics such as Tree Edit Distance score (TEDs) for table structure prediction, and Mean Average Precision (mAP) with 0.75 Intersection Over Union (IOU) threshold for the bounding-box predictions of table cells. The predicted OTSL structures were converted back to HTML format in" } ], "headers": [ { "label": "page_header", "id": 9, "page_no": 7, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 139.37, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.83, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 139.37, "r_y1": 101.84, "r_x2": 139.37, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8" }, { "label": "page_header", "id": 8, "page_no": 7, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 167.81, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.863, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.81, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.81, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.37, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.37, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 8, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.6, "r_y1": 139.69, "r_x2": 480.6, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 210.78, "r_y1": 151.64, "r_x2": 210.78, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 177.99, "r_x1": 149.4, "r_y1": 177.99, "r_x2": 149.4, "r_y2": 169.19, "r_x3": 134.76, "r_y3": 169.19, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 177.99, "r_x1": 318.45, "r_y1": 177.99, "r_x2": 318.45, "r_y2": 169.19, "r_x3": 160.86, "r_y3": 169.19, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 194.38, "r_x1": 480.59, "r_y1": 194.38, "r_x2": 480.59, "r_y2": 185.59, "r_x3": 134.76, "r_y3": 185.59, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 206.34, "r_x1": 480.59, "r_y1": 206.34, "r_x2": 480.59, "r_y2": 197.54, "r_x3": 134.76, "r_y3": 197.54, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 218.29, "r_x1": 480.59, "r_y1": 218.29, "r_x2": 480.59, "r_y2": 209.5, "r_x3": 134.76, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 230.25, "r_x1": 480.59, "r_y1": 230.25, "r_x2": 480.59, "r_y2": 221.45, "r_x3": 134.76, "r_y3": 221.45, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 242.2, "r_x1": 440.94, "r_y1": 242.2, "r_x2": 440.94, "r_y2": 233.41, "r_x3": 134.76, "r_y3": 233.41, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.87, "r_y0": 242.2, "r_x1": 480.59, "r_y1": 242.2, "r_x2": 480.59, "r_y2": 233.41, "r_x3": 444.87, "r_y3": 233.41, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 254.16, "r_x1": 145.2, "r_y1": 254.16, "r_x2": 145.2, "r_y2": 245.36, "r_x3": 134.76, "r_y3": 245.36, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.15, "r_y0": 254.16, "r_x1": 311.22, "r_y1": 254.16, "r_x2": 311.22, "r_y2": 245.36, "r_x3": 149.15, "r_y3": 245.36, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.0, "r_x1": 160.12, "r_y1": 283.0, "r_x2": 160.12, "r_y2": 275.07, "r_x3": 134.76, "r_y3": 275.07, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.35, "r_y0": 283.0, "r_x1": 175.6, "r_y1": 283.0, "r_x2": 175.6, "r_y2": 275.07, "r_x3": 167.35, "r_y3": 275.07, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.13, "r_y0": 283.2, "r_x1": 480.59, "r_y1": 283.2, "r_x2": 480.59, "r_y2": 275.14, "r_x3": 188.13, "r_y3": 275.14, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 294.16, "r_x1": 480.59, "r_y1": 294.16, "r_x2": 480.59, "r_y2": 286.09, "r_x3": 134.76, "r_y3": 286.09, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 305.12, "r_x1": 480.6, "r_y1": 305.12, "r_x2": 480.6, "r_y2": 297.05, "r_x3": 134.76, "r_y3": 297.05, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 316.08, "r_x1": 480.59, "r_y1": 316.08, "r_x2": 480.59, "r_y2": 308.01, "r_x3": 134.76, "r_y3": 308.01, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 327.04, "r_x1": 480.59, "r_y1": 327.04, "r_x2": 480.59, "r_y2": 318.97, "r_x3": 134.76, "r_y3": 318.97, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8, "r_x1": 168.05, "r_y1": 349.8, "r_x2": 168.05, "r_y2": 341.73, "r_x3": 160.37, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.59, "r_y0": 362.76, "r_x1": 183.83, "r_y1": 362.76, "r_x2": 183.83, "r_y2": 354.69, "r_x3": 144.59, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.97, "r_y0": 349.8, "r_x1": 215.65, "r_y1": 349.8, "r_x2": 215.65, "r_y2": 341.73, "r_x3": 207.97, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19, "r_y0": 362.76, "r_x1": 231.43, "r_y1": 362.76, "r_x2": 231.43, "r_y2": 354.69, "r_x3": 192.19, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.28, "r_x1": 278.32, "r_y1": 355.28, "r_x2": 278.32, "r_y2": 347.21, "r_x3": 239.8, "r_y3": 347.21, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67, "r_y0": 349.8, "r_x1": 348.26, "r_y1": 349.8, "r_x2": 348.26, "r_y2": 341.73, "r_x3": 324.67, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 349.8, "r_x1": 417.13, "r_y1": 349.8, "r_x2": 417.13, "r_y2": 341.73, "r_x3": 396.27, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.93, "r_y0": 360.76, "r_x1": 418.47, "r_y1": 360.76, "r_x2": 418.47, "r_y2": 352.69, "r_x3": 394.93, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.77, "r_y0": 349.8, "r_x1": 467.14, "r_y1": 349.8, "r_x2": 467.14, "r_y2": 341.73, "r_x3": 430.77, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.15, "r_y0": 360.76, "r_x1": 470.76, "r_y1": 360.76, "r_x2": 470.76, "r_y2": 352.69, "r_x3": 427.15, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.69, "r_y0": 362.76, "r_x1": 312.33, "r_y1": 362.76, "r_x2": 312.33, "r_y2": 354.69, "r_x3": 286.69, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.76, "r_x1": 353.72, "r_y1": 362.76, "r_x2": 353.72, "r_y2": 354.69, "r_x3": 320.7, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.31, "r_y0": 362.76, "r_x1": 379.03, "r_y1": 362.76, "r_x2": 379.03, "r_y2": 354.69, "r_x3": 369.31, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 381.59, "r_x1": 166.51, "r_y1": 381.59, "r_x2": 166.51, "r_y2": 373.52, "r_x3": 161.91, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 381.59, "r_x1": 214.12, "r_y1": 381.59, "r_x2": 214.12, "r_y2": 373.52, "r_x3": 209.51, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 376.11, "r_x1": 271.41, "r_y1": 376.11, "r_x2": 271.41, "r_y2": 368.04, "r_x3": 246.71, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 376.11, "r_x1": 310.0, "r_y1": 376.11, "r_x2": 310.0, "r_y2": 368.04, "r_x3": 289.02, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 376.11, "r_x1": 347.7, "r_y1": 376.11, "r_x2": 347.7, "r_y2": 368.04, "r_x3": 326.72, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 376.11, "r_x1": 384.66, "r_y1": 376.11, "r_x2": 384.66, "r_y2": 368.04, "r_x3": 363.68, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.27, "r_y0": 375.9, "r_x1": 416.13, "r_y1": 375.9, "r_x2": 416.13, "r_y2": 367.97, "r_x3": 397.27, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 375.9, "r_x1": 458.38, "r_y1": 375.9, "r_x2": 458.38, "r_y2": 367.97, "r_x3": 439.53, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 389.06, "r_x1": 272.94, "r_y1": 389.06, "r_x2": 272.94, "r_y2": 380.99, "r_x3": 245.18, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 389.06, "r_x1": 310.0, "r_y1": 389.06, "r_x2": 310.0, "r_y2": 380.99, "r_x3": 289.02, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 389.06, "r_x1": 347.7, "r_y1": 389.06, "r_x2": 347.7, "r_y2": 380.99, "r_x3": 326.72, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 389.06, "r_x1": 384.66, "r_y1": 389.06, "r_x2": 384.66, "r_y2": 380.99, "r_x3": 363.68, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 389.06, "r_x1": 417.19, "r_y1": 389.06, "r_x2": 417.19, "r_y2": 380.99, "r_x3": 396.21, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 389.06, "r_x1": 457.15, "r_y1": 389.06, "r_x2": 457.15, "r_y2": 380.99, "r_x3": 440.77, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 407.89, "r_x1": 166.51, "r_y1": 407.89, "r_x2": 166.51, "r_y2": 399.82, "r_x3": 161.91, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 407.89, "r_x1": 214.12, "r_y1": 407.89, "r_x2": 214.12, "r_y2": 399.82, "r_x3": 209.51, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 402.41, "r_x1": 271.41, "r_y1": 402.41, "r_x2": 271.41, "r_y2": 394.34, "r_x3": 246.71, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 402.41, "r_x1": 310.0, "r_y1": 402.41, "r_x2": 310.0, "r_y2": 394.34, "r_x3": 289.02, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 402.41, "r_x1": 347.7, "r_y1": 402.41, "r_x2": 347.7, "r_y2": 394.34, "r_x3": 326.72, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 402.41, "r_x1": 384.66, "r_y1": 402.41, "r_x2": 384.66, "r_y2": 394.34, "r_x3": 363.68, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 402.2, "r_x1": 418.78, "r_y1": 402.2, "r_x2": 418.78, "r_y2": 394.28, "r_x3": 394.62, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 402.2, "r_x1": 458.38, "r_y1": 402.2, "r_x2": 458.38, "r_y2": 394.28, "r_x3": 439.53, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 415.36, "r_x1": 272.94, "r_y1": 415.36, "r_x2": 272.94, "r_y2": 407.29, "r_x3": 245.18, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 415.36, "r_x1": 310.0, "r_y1": 415.36, "r_x2": 310.0, "r_y2": 407.29, "r_x3": 289.02, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 415.36, "r_x1": 347.7, "r_y1": 415.36, "r_x2": 347.7, "r_y2": 407.29, "r_x3": 326.72, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 415.15, "r_x1": 386.25, "r_y1": 415.15, "r_x2": 386.25, "r_y2": 407.23, "r_x3": 362.09, "r_y3": 407.23, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 415.36, "r_x1": 417.19, "r_y1": 415.36, "r_x2": 417.19, "r_y2": 407.29, "r_x3": 396.21, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 415.36, "r_x1": 457.15, "r_y1": 415.36, "r_x2": 457.15, "r_y2": 407.29, "r_x3": 440.77, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 434.19, "r_x1": 166.51, "r_y1": 434.19, "r_x2": 166.51, "r_y2": 426.12, "r_x3": 161.91, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 434.19, "r_x1": 214.12, "r_y1": 434.19, "r_x2": 214.12, "r_y2": 426.12, "r_x3": 209.51, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 428.71, "r_x1": 271.41, "r_y1": 428.71, "r_x2": 271.41, "r_y2": 420.64, "r_x3": 246.71, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 428.71, "r_x1": 310.0, "r_y1": 428.71, "r_x2": 310.0, "r_y2": 420.64, "r_x3": 289.02, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 428.71, "r_x1": 347.7, "r_y1": 428.71, "r_x2": 347.7, "r_y2": 420.64, "r_x3": 326.72, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 428.71, "r_x1": 384.66, "r_y1": 428.71, "r_x2": 384.66, "r_y2": 420.64, "r_x3": 363.68, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 428.5, "r_x1": 418.78, "r_y1": 428.5, "r_x2": 418.78, "r_y2": 420.58, "r_x3": 394.62, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 428.5, "r_x1": 458.38, "r_y1": 428.5, "r_x2": 458.38, "r_y2": 420.58, "r_x3": 439.53, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 441.66, "r_x1": 272.94, "r_y1": 441.66, "r_x2": 272.94, "r_y2": 433.59, "r_x3": 245.18, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 441.66, "r_x1": 310.0, "r_y1": 441.66, "r_x2": 310.0, "r_y2": 433.59, "r_x3": 289.02, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 441.66, "r_x1": 347.7, "r_y1": 441.66, "r_x2": 347.7, "r_y2": 433.59, "r_x3": 326.72, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 441.45, "r_x1": 386.25, "r_y1": 441.45, "r_x2": 386.25, "r_y2": 433.53, "r_x3": 362.09, "r_y3": 433.53, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 441.66, "r_x1": 417.19, "r_y1": 441.66, "r_x2": 417.19, "r_y2": 433.59, "r_x3": 396.21, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 441.66, "r_x1": 457.15, "r_y1": 441.66, "r_x2": 457.15, "r_y2": 433.59, "r_x3": 440.77, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 460.49, "r_x1": 166.51, "r_y1": 460.49, "r_x2": 166.51, "r_y2": 452.42, "r_x3": 161.91, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 460.49, "r_x1": 214.12, "r_y1": 460.49, "r_x2": 214.12, "r_y2": 452.42, "r_x3": 209.51, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 455.01, "r_x1": 271.41, "r_y1": 455.01, "r_x2": 271.41, "r_y2": 446.94, "r_x3": 246.71, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 455.01, "r_x1": 310.0, "r_y1": 455.01, "r_x2": 310.0, "r_y2": 446.94, "r_x3": 289.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.02, "r_y0": 455.01, "r_x1": 345.4, "r_y1": 455.01, "r_x2": 345.4, "r_y2": 446.94, "r_x3": 329.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 454.8, "r_x1": 386.25, "r_y1": 454.8, "r_x2": 386.25, "r_y2": 446.88, "r_x3": 362.09, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 454.8, "r_x1": 418.78, "r_y1": 454.8, "r_x2": 418.78, "r_y2": 446.88, "r_x3": 394.62, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 454.8, "r_x1": 458.38, "r_y1": 454.8, "r_x2": 458.38, "r_y2": 446.88, "r_x3": 439.53, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 467.96, "r_x1": 272.94, "r_y1": 467.96, "r_x2": 272.94, "r_y2": 459.89, "r_x3": 245.18, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 467.96, "r_x1": 310.0, "r_y1": 467.96, "r_x2": 310.0, "r_y2": 459.89, "r_x3": 289.02, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 467.96, "r_x1": 347.7, "r_y1": 467.96, "r_x2": 347.7, "r_y2": 459.89, "r_x3": 326.72, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 467.96, "r_x1": 384.66, "r_y1": 467.96, "r_x2": 384.66, "r_y2": 459.89, "r_x3": 363.68, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 467.96, "r_x1": 417.19, "r_y1": 467.96, "r_x2": 417.19, "r_y2": 459.89, "r_x3": 396.21, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65, "r_y0": 467.96, "r_x1": 451.26, "r_y1": 467.96, "r_x2": 451.26, "r_y2": 459.89, "r_x3": 446.65, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 516.96, "r_x1": 149.4, "r_y1": 516.96, "r_x2": 149.4, "r_y2": 508.15, "r_x3": 134.76, "r_y3": 508.15, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 516.96, "r_x1": 264.4, "r_y1": 516.96, "r_x2": 264.4, "r_y2": 508.15, "r_x3": 160.86, "r_y3": 508.15, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.76, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.6, "r_y1": 557.26, "r_x2": 480.6, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.76, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.6, "r_y1": 593.12, "r_x2": 480.6, "r_y2": 584.33, "r_x3": 134.76, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 206.79, "r_y1": 617.03, "r_x2": 206.79, "r_y2": 608.24, "r_x3": 134.76, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 149.71, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.6, "r_y1": 640.94, "r_x2": 480.6, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 405.8, "r_y1": 664.85, "r_x2": 405.8, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 8, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.937, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.886, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.6, "b": 151.64, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.6, "r_y1": 139.69, "r_x2": 480.6, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 210.78, "r_y1": 151.64, "r_x2": 210.78, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "section_header", "bbox": { "l": 134.76, "t": 169.19, "r": 318.45, "b": 177.99, "coord_origin": "TOPLEFT" }, "confidence": 0.958, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 177.99, "r_x1": 149.4, "r_y1": 177.99, "r_x2": 149.4, "r_y2": 169.19, "r_x3": 134.76, "r_y3": 169.19, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 177.99, "r_x1": 318.45, "r_y1": 177.99, "r_x2": 318.45, "r_y2": 169.19, "r_x3": 160.86, "r_y3": 169.19, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "text", "bbox": { "l": 134.76, "t": 185.59, "r": 480.59, "b": 254.16, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 194.38, "r_x1": 480.59, "r_y1": 194.38, "r_x2": 480.59, "r_y2": 185.59, "r_x3": 134.76, "r_y3": 185.59, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 206.34, "r_x1": 480.59, "r_y1": 206.34, "r_x2": 480.59, "r_y2": 197.54, "r_x3": 134.76, "r_y3": 197.54, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 218.29, "r_x1": 480.59, "r_y1": 218.29, "r_x2": 480.59, "r_y2": 209.5, "r_x3": 134.76, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 230.25, "r_x1": 480.59, "r_y1": 230.25, "r_x2": 480.59, "r_y2": 221.45, "r_x3": 134.76, "r_y3": 221.45, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 242.2, "r_x1": 440.94, "r_y1": 242.2, "r_x2": 440.94, "r_y2": 233.41, "r_x3": 134.76, "r_y3": 233.41, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.87, "r_y0": 242.2, "r_x1": 480.59, "r_y1": 242.2, "r_x2": 480.59, "r_y2": 233.41, "r_x3": 444.87, "r_y3": 233.41, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 254.16, "r_x1": 145.2, "r_y1": 254.16, "r_x2": 145.2, "r_y2": 245.36, "r_x3": 134.76, "r_y3": 245.36, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.15, "r_y0": 254.16, "r_x1": 311.22, "r_y1": 254.16, "r_x2": 311.22, "r_y2": 245.36, "r_x3": 149.15, "r_y3": 245.36, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "caption", "bbox": { "l": 134.76, "t": 275.07, "r": 480.6, "b": 327.04, "coord_origin": "TOPLEFT" }, "confidence": 0.957, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.0, "r_x1": 160.12, "r_y1": 283.0, "r_x2": 160.12, "r_y2": 275.07, "r_x3": 134.76, "r_y3": 275.07, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.35, "r_y0": 283.0, "r_x1": 175.6, "r_y1": 283.0, "r_x2": 175.6, "r_y2": 275.07, "r_x3": 167.35, "r_y3": 275.07, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.13, "r_y0": 283.2, "r_x1": 480.59, "r_y1": 283.2, "r_x2": 480.59, "r_y2": 275.14, "r_x3": 188.13, "r_y3": 275.14, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 294.16, "r_x1": 480.59, "r_y1": 294.16, "r_x2": 480.59, "r_y2": 286.09, "r_x3": 134.76, "r_y3": 286.09, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 305.12, "r_x1": 480.6, "r_y1": 305.12, "r_x2": 480.6, "r_y2": 297.05, "r_x3": 134.76, "r_y3": 297.05, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 316.08, "r_x1": 480.59, "r_y1": 316.08, "r_x2": 480.59, "r_y2": 308.01, "r_x3": 134.76, "r_y3": 308.01, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 327.04, "r_x1": 480.59, "r_y1": 327.04, "r_x2": 480.59, "r_y2": 318.97, "r_x3": 134.76, "r_y3": 318.97, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 139.67, "t": 337.57, "r": 475.0, "b": 469.47, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8, "r_x1": 168.05, "r_y1": 349.8, "r_x2": 168.05, "r_y2": 341.73, "r_x3": 160.37, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.59, "r_y0": 362.76, "r_x1": 183.83, "r_y1": 362.76, "r_x2": 183.83, "r_y2": 354.69, "r_x3": 144.59, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.97, "r_y0": 349.8, "r_x1": 215.65, "r_y1": 349.8, "r_x2": 215.65, "r_y2": 341.73, "r_x3": 207.97, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19, "r_y0": 362.76, "r_x1": 231.43, "r_y1": 362.76, "r_x2": 231.43, "r_y2": 354.69, "r_x3": 192.19, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.28, "r_x1": 278.32, "r_y1": 355.28, "r_x2": 278.32, "r_y2": 347.21, "r_x3": 239.8, "r_y3": 347.21, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67, "r_y0": 349.8, "r_x1": 348.26, "r_y1": 349.8, "r_x2": 348.26, "r_y2": 341.73, "r_x3": 324.67, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 349.8, "r_x1": 417.13, "r_y1": 349.8, "r_x2": 417.13, "r_y2": 341.73, "r_x3": 396.27, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.93, "r_y0": 360.76, "r_x1": 418.47, "r_y1": 360.76, "r_x2": 418.47, "r_y2": 352.69, "r_x3": 394.93, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.77, "r_y0": 349.8, "r_x1": 467.14, "r_y1": 349.8, "r_x2": 467.14, "r_y2": 341.73, "r_x3": 430.77, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.15, "r_y0": 360.76, "r_x1": 470.76, "r_y1": 360.76, "r_x2": 470.76, "r_y2": 352.69, "r_x3": 427.15, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.69, "r_y0": 362.76, "r_x1": 312.33, "r_y1": 362.76, "r_x2": 312.33, "r_y2": 354.69, "r_x3": 286.69, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.76, "r_x1": 353.72, "r_y1": 362.76, "r_x2": 353.72, "r_y2": 354.69, "r_x3": 320.7, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.31, "r_y0": 362.76, "r_x1": 379.03, "r_y1": 362.76, "r_x2": 379.03, "r_y2": 354.69, "r_x3": 369.31, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 381.59, "r_x1": 166.51, "r_y1": 381.59, "r_x2": 166.51, "r_y2": 373.52, "r_x3": 161.91, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 381.59, "r_x1": 214.12, "r_y1": 381.59, "r_x2": 214.12, "r_y2": 373.52, "r_x3": 209.51, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 376.11, "r_x1": 271.41, "r_y1": 376.11, "r_x2": 271.41, "r_y2": 368.04, "r_x3": 246.71, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 376.11, "r_x1": 310.0, "r_y1": 376.11, "r_x2": 310.0, "r_y2": 368.04, "r_x3": 289.02, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 376.11, "r_x1": 347.7, "r_y1": 376.11, "r_x2": 347.7, "r_y2": 368.04, "r_x3": 326.72, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 376.11, "r_x1": 384.66, "r_y1": 376.11, "r_x2": 384.66, "r_y2": 368.04, "r_x3": 363.68, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.27, "r_y0": 375.9, "r_x1": 416.13, "r_y1": 375.9, "r_x2": 416.13, "r_y2": 367.97, "r_x3": 397.27, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 375.9, "r_x1": 458.38, "r_y1": 375.9, "r_x2": 458.38, "r_y2": 367.97, "r_x3": 439.53, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 389.06, "r_x1": 272.94, "r_y1": 389.06, "r_x2": 272.94, "r_y2": 380.99, "r_x3": 245.18, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 389.06, "r_x1": 310.0, "r_y1": 389.06, "r_x2": 310.0, "r_y2": 380.99, "r_x3": 289.02, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 389.06, "r_x1": 347.7, "r_y1": 389.06, "r_x2": 347.7, "r_y2": 380.99, "r_x3": 326.72, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 389.06, "r_x1": 384.66, "r_y1": 389.06, "r_x2": 384.66, "r_y2": 380.99, "r_x3": 363.68, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 389.06, "r_x1": 417.19, "r_y1": 389.06, "r_x2": 417.19, "r_y2": 380.99, "r_x3": 396.21, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 389.06, "r_x1": 457.15, "r_y1": 389.06, "r_x2": 457.15, "r_y2": 380.99, "r_x3": 440.77, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 407.89, "r_x1": 166.51, "r_y1": 407.89, "r_x2": 166.51, "r_y2": 399.82, "r_x3": 161.91, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 407.89, "r_x1": 214.12, "r_y1": 407.89, "r_x2": 214.12, "r_y2": 399.82, "r_x3": 209.51, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 402.41, "r_x1": 271.41, "r_y1": 402.41, "r_x2": 271.41, "r_y2": 394.34, "r_x3": 246.71, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 402.41, "r_x1": 310.0, "r_y1": 402.41, "r_x2": 310.0, "r_y2": 394.34, "r_x3": 289.02, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 402.41, "r_x1": 347.7, "r_y1": 402.41, "r_x2": 347.7, "r_y2": 394.34, "r_x3": 326.72, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 402.41, "r_x1": 384.66, "r_y1": 402.41, "r_x2": 384.66, "r_y2": 394.34, "r_x3": 363.68, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 402.2, "r_x1": 418.78, "r_y1": 402.2, "r_x2": 418.78, "r_y2": 394.28, "r_x3": 394.62, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 402.2, "r_x1": 458.38, "r_y1": 402.2, "r_x2": 458.38, "r_y2": 394.28, "r_x3": 439.53, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 415.36, "r_x1": 272.94, "r_y1": 415.36, "r_x2": 272.94, "r_y2": 407.29, "r_x3": 245.18, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 415.36, "r_x1": 310.0, "r_y1": 415.36, "r_x2": 310.0, "r_y2": 407.29, "r_x3": 289.02, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 415.36, "r_x1": 347.7, "r_y1": 415.36, "r_x2": 347.7, "r_y2": 407.29, "r_x3": 326.72, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 415.15, "r_x1": 386.25, "r_y1": 415.15, "r_x2": 386.25, "r_y2": 407.23, "r_x3": 362.09, "r_y3": 407.23, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 415.36, "r_x1": 417.19, "r_y1": 415.36, "r_x2": 417.19, "r_y2": 407.29, "r_x3": 396.21, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 415.36, "r_x1": 457.15, "r_y1": 415.36, "r_x2": 457.15, "r_y2": 407.29, "r_x3": 440.77, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 434.19, "r_x1": 166.51, "r_y1": 434.19, "r_x2": 166.51, "r_y2": 426.12, "r_x3": 161.91, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 434.19, "r_x1": 214.12, "r_y1": 434.19, "r_x2": 214.12, "r_y2": 426.12, "r_x3": 209.51, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 428.71, "r_x1": 271.41, "r_y1": 428.71, "r_x2": 271.41, "r_y2": 420.64, "r_x3": 246.71, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 428.71, "r_x1": 310.0, "r_y1": 428.71, "r_x2": 310.0, "r_y2": 420.64, "r_x3": 289.02, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 428.71, "r_x1": 347.7, "r_y1": 428.71, "r_x2": 347.7, "r_y2": 420.64, "r_x3": 326.72, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 428.71, "r_x1": 384.66, "r_y1": 428.71, "r_x2": 384.66, "r_y2": 420.64, "r_x3": 363.68, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 428.5, "r_x1": 418.78, "r_y1": 428.5, "r_x2": 418.78, "r_y2": 420.58, "r_x3": 394.62, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 428.5, "r_x1": 458.38, "r_y1": 428.5, "r_x2": 458.38, "r_y2": 420.58, "r_x3": 439.53, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 441.66, "r_x1": 272.94, "r_y1": 441.66, "r_x2": 272.94, "r_y2": 433.59, "r_x3": 245.18, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 441.66, "r_x1": 310.0, "r_y1": 441.66, "r_x2": 310.0, "r_y2": 433.59, "r_x3": 289.02, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 441.66, "r_x1": 347.7, "r_y1": 441.66, "r_x2": 347.7, "r_y2": 433.59, "r_x3": 326.72, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 441.45, "r_x1": 386.25, "r_y1": 441.45, "r_x2": 386.25, "r_y2": 433.53, "r_x3": 362.09, "r_y3": 433.53, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 441.66, "r_x1": 417.19, "r_y1": 441.66, "r_x2": 417.19, "r_y2": 433.59, "r_x3": 396.21, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 441.66, "r_x1": 457.15, "r_y1": 441.66, "r_x2": 457.15, "r_y2": 433.59, "r_x3": 440.77, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 460.49, "r_x1": 166.51, "r_y1": 460.49, "r_x2": 166.51, "r_y2": 452.42, "r_x3": 161.91, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 460.49, "r_x1": 214.12, "r_y1": 460.49, "r_x2": 214.12, "r_y2": 452.42, "r_x3": 209.51, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 455.01, "r_x1": 271.41, "r_y1": 455.01, "r_x2": 271.41, "r_y2": 446.94, "r_x3": 246.71, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 455.01, "r_x1": 310.0, "r_y1": 455.01, "r_x2": 310.0, "r_y2": 446.94, "r_x3": 289.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.02, "r_y0": 455.01, "r_x1": 345.4, "r_y1": 455.01, "r_x2": 345.4, "r_y2": 446.94, "r_x3": 329.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 454.8, "r_x1": 386.25, "r_y1": 454.8, "r_x2": 386.25, "r_y2": 446.88, "r_x3": 362.09, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 454.8, "r_x1": 418.78, "r_y1": 454.8, "r_x2": 418.78, "r_y2": 446.88, "r_x3": 394.62, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 454.8, "r_x1": 458.38, "r_y1": 454.8, "r_x2": 458.38, "r_y2": 446.88, "r_x3": 439.53, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 467.96, "r_x1": 272.94, "r_y1": 467.96, "r_x2": 272.94, "r_y2": 459.89, "r_x3": 245.18, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 467.96, "r_x1": 310.0, "r_y1": 467.96, "r_x2": 310.0, "r_y2": 459.89, "r_x3": 289.02, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 467.96, "r_x1": 347.7, "r_y1": 467.96, "r_x2": 347.7, "r_y2": 459.89, "r_x3": 326.72, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 467.96, "r_x1": 384.66, "r_y1": 467.96, "r_x2": 384.66, "r_y2": 459.89, "r_x3": 363.68, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 467.96, "r_x1": 417.19, "r_y1": 467.96, "r_x2": 417.19, "r_y2": 459.89, "r_x3": 396.21, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65, "r_y0": 467.96, "r_x1": 451.26, "r_y1": 467.96, "r_x2": 451.26, "r_y2": 459.89, "r_x3": 446.65, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.37, "t": 341.73, "r": 168.05, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8, "r_x1": 168.05, "r_y1": 349.8, "r_x2": 168.05, "r_y2": 341.73, "r_x3": 160.37, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.59, "t": 354.69, "r": 183.83, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.59, "r_y0": 362.76, "r_x1": 183.83, "r_y1": 362.76, "r_x2": 183.83, "r_y2": 354.69, "r_x3": 144.59, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 207.97, "t": 341.73, "r": 215.65, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.97, "r_y0": 349.8, "r_x1": 215.65, "r_y1": 349.8, "r_x2": 215.65, "r_y2": 341.73, "r_x3": 207.97, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.19, "t": 354.69, "r": 231.43, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19, "r_y0": 362.76, "r_x1": 231.43, "r_y1": 362.76, "r_x2": 231.43, "r_y2": 354.69, "r_x3": 192.19, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.8, "t": 347.21, "r": 278.32, "b": 355.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.28, "r_x1": 278.32, "r_y1": 355.28, "r_x2": 278.32, "r_y2": 347.21, "r_x3": 239.8, "r_y3": 347.21, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.67, "t": 341.73, "r": 348.26, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67, "r_y0": 349.8, "r_x1": 348.26, "r_y1": 349.8, "r_x2": 348.26, "r_y2": 341.73, "r_x3": 324.67, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.27, "t": 341.73, "r": 417.13, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 349.8, "r_x1": 417.13, "r_y1": 349.8, "r_x2": 417.13, "r_y2": 341.73, "r_x3": 396.27, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.93, "t": 352.69, "r": 418.47, "b": 360.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.93, "r_y0": 360.76, "r_x1": 418.47, "r_y1": 360.76, "r_x2": 418.47, "r_y2": 352.69, "r_x3": 394.93, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.77, "t": 341.73, "r": 467.14, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.77, "r_y0": 349.8, "r_x1": 467.14, "r_y1": 349.8, "r_x2": 467.14, "r_y2": 341.73, "r_x3": 430.77, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.15, "t": 352.69, "r": 470.76, "b": 360.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.15, "r_y0": 360.76, "r_x1": 470.76, "r_y1": 360.76, "r_x2": 470.76, "r_y2": 352.69, "r_x3": 427.15, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.69, "t": 354.69, "r": 312.33, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.69, "r_y0": 362.76, "r_x1": 312.33, "r_y1": 362.76, "r_x2": 312.33, "r_y2": 354.69, "r_x3": 286.69, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.7, "t": 354.69, "r": 353.72, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.76, "r_x1": 353.72, "r_y1": 362.76, "r_x2": 353.72, "r_y2": 354.69, "r_x3": 320.7, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.31, "t": 354.69, "r": 379.03, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.31, "r_y0": 362.76, "r_x1": 379.03, "r_y1": 362.76, "r_x2": 379.03, "r_y2": 354.69, "r_x3": 369.31, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.91, "t": 373.52, "r": 166.51, "b": 381.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 381.59, "r_x1": 166.51, "r_y1": 381.59, "r_x2": 166.51, "r_y2": 373.52, "r_x3": 161.91, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.51, "t": 373.52, "r": 214.12, "b": 381.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 381.59, "r_x1": 214.12, "r_y1": 381.59, "r_x2": 214.12, "r_y2": 373.52, "r_x3": 209.51, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.71, "t": 368.04, "r": 271.41, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 376.11, "r_x1": 271.41, "r_y1": 376.11, "r_x2": 271.41, "r_y2": 368.04, "r_x3": 246.71, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.02, "t": 368.04, "r": 310.0, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 376.11, "r_x1": 310.0, "r_y1": 376.11, "r_x2": 310.0, "r_y2": 368.04, "r_x3": 289.02, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.72, "t": 368.04, "r": 347.7, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 376.11, "r_x1": 347.7, "r_y1": 376.11, "r_x2": 347.7, "r_y2": 368.04, "r_x3": 326.72, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.68, "t": 368.04, "r": 384.66, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 376.11, "r_x1": 384.66, "r_y1": 376.11, "r_x2": 384.66, "r_y2": 368.04, "r_x3": 363.68, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.27, "t": 367.97, "r": 416.13, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.27, "r_y0": 375.9, "r_x1": 416.13, "r_y1": 375.9, "r_x2": 416.13, "r_y2": 367.97, "r_x3": 397.27, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.53, "t": 367.97, "r": 458.38, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 375.9, "r_x1": 458.38, "r_y1": 375.9, "r_x2": 458.38, "r_y2": 367.97, "r_x3": 439.53, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.18, "t": 380.99, "r": 272.94, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 389.06, "r_x1": 272.94, "r_y1": 389.06, "r_x2": 272.94, "r_y2": 380.99, "r_x3": 245.18, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.02, "t": 380.99, "r": 310.0, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 389.06, "r_x1": 310.0, "r_y1": 389.06, "r_x2": 310.0, "r_y2": 380.99, "r_x3": 289.02, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.72, "t": 380.99, "r": 347.7, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 389.06, "r_x1": 347.7, "r_y1": 389.06, "r_x2": 347.7, "r_y2": 380.99, "r_x3": 326.72, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.68, "t": 380.99, "r": 384.66, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 389.06, "r_x1": 384.66, "r_y1": 389.06, "r_x2": 384.66, "r_y2": 380.99, "r_x3": 363.68, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.21, "t": 380.99, "r": 417.19, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 389.06, "r_x1": 417.19, "r_y1": 389.06, "r_x2": 417.19, "r_y2": 380.99, "r_x3": 396.21, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.77, "t": 380.99, "r": 457.15, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 389.06, "r_x1": 457.15, "r_y1": 389.06, "r_x2": 457.15, "r_y2": 380.99, "r_x3": 440.77, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.91, "t": 399.82, "r": 166.51, "b": 407.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 407.89, "r_x1": 166.51, "r_y1": 407.89, "r_x2": 166.51, "r_y2": 399.82, "r_x3": 161.91, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.51, "t": 399.82, "r": 214.12, "b": 407.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 407.89, "r_x1": 214.12, "r_y1": 407.89, "r_x2": 214.12, "r_y2": 399.82, "r_x3": 209.51, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.71, "t": 394.34, "r": 271.41, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 402.41, "r_x1": 271.41, "r_y1": 402.41, "r_x2": 271.41, "r_y2": 394.34, "r_x3": 246.71, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.02, "t": 394.34, "r": 310.0, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 402.41, "r_x1": 310.0, "r_y1": 402.41, "r_x2": 310.0, "r_y2": 394.34, "r_x3": 289.02, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.72, "t": 394.34, "r": 347.7, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 402.41, "r_x1": 347.7, "r_y1": 402.41, "r_x2": 347.7, "r_y2": 394.34, "r_x3": 326.72, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.68, "t": 394.34, "r": 384.66, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 402.41, "r_x1": 384.66, "r_y1": 402.41, "r_x2": 384.66, "r_y2": 394.34, "r_x3": 363.68, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.62, "t": 394.28, "r": 418.78, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 402.2, "r_x1": 418.78, "r_y1": 402.2, "r_x2": 418.78, "r_y2": 394.28, "r_x3": 394.62, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.53, "t": 394.28, "r": 458.38, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 402.2, "r_x1": 458.38, "r_y1": 402.2, "r_x2": 458.38, "r_y2": 394.28, "r_x3": 439.53, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.18, "t": 407.29, "r": 272.94, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 415.36, "r_x1": 272.94, "r_y1": 415.36, "r_x2": 272.94, "r_y2": 407.29, "r_x3": 245.18, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.02, "t": 407.29, "r": 310.0, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 415.36, "r_x1": 310.0, "r_y1": 415.36, "r_x2": 310.0, "r_y2": 407.29, "r_x3": 289.02, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.72, "t": 407.29, "r": 347.7, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 415.36, "r_x1": 347.7, "r_y1": 415.36, "r_x2": 347.7, "r_y2": 407.29, "r_x3": 326.72, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.09, "t": 407.23, "r": 386.25, "b": 415.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 415.15, "r_x1": 386.25, "r_y1": 415.15, "r_x2": 386.25, "r_y2": 407.23, "r_x3": 362.09, "r_y3": 407.23, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.21, "t": 407.29, "r": 417.19, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 415.36, "r_x1": 417.19, "r_y1": 415.36, "r_x2": 417.19, "r_y2": 407.29, "r_x3": 396.21, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.77, "t": 407.29, "r": 457.15, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 415.36, "r_x1": 457.15, "r_y1": 415.36, "r_x2": 457.15, "r_y2": 407.29, "r_x3": 440.77, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.91, "t": 426.12, "r": 166.51, "b": 434.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 434.19, "r_x1": 166.51, "r_y1": 434.19, "r_x2": 166.51, "r_y2": 426.12, "r_x3": 161.91, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.51, "t": 426.12, "r": 214.12, "b": 434.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 434.19, "r_x1": 214.12, "r_y1": 434.19, "r_x2": 214.12, "r_y2": 426.12, "r_x3": 209.51, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.71, "t": 420.64, "r": 271.41, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 428.71, "r_x1": 271.41, "r_y1": 428.71, "r_x2": 271.41, "r_y2": 420.64, "r_x3": 246.71, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.02, "t": 420.64, "r": 310.0, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 428.71, "r_x1": 310.0, "r_y1": 428.71, "r_x2": 310.0, "r_y2": 420.64, "r_x3": 289.02, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.72, "t": 420.64, "r": 347.7, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 428.71, "r_x1": 347.7, "r_y1": 428.71, "r_x2": 347.7, "r_y2": 420.64, "r_x3": 326.72, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.68, "t": 420.64, "r": 384.66, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 428.71, "r_x1": 384.66, "r_y1": 428.71, "r_x2": 384.66, "r_y2": 420.64, "r_x3": 363.68, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.62, "t": 420.58, "r": 418.78, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 428.5, "r_x1": 418.78, "r_y1": 428.5, "r_x2": 418.78, "r_y2": 420.58, "r_x3": 394.62, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.53, "t": 420.58, "r": 458.38, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 428.5, "r_x1": 458.38, "r_y1": 428.5, "r_x2": 458.38, "r_y2": 420.58, "r_x3": 439.53, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.18, "t": 433.59, "r": 272.94, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 441.66, "r_x1": 272.94, "r_y1": 441.66, "r_x2": 272.94, "r_y2": 433.59, "r_x3": 245.18, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.02, "t": 433.59, "r": 310.0, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 441.66, "r_x1": 310.0, "r_y1": 441.66, "r_x2": 310.0, "r_y2": 433.59, "r_x3": 289.02, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.72, "t": 433.59, "r": 347.7, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 441.66, "r_x1": 347.7, "r_y1": 441.66, "r_x2": 347.7, "r_y2": 433.59, "r_x3": 326.72, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.09, "t": 433.53, "r": 386.25, "b": 441.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 441.45, "r_x1": 386.25, "r_y1": 441.45, "r_x2": 386.25, "r_y2": 433.53, "r_x3": 362.09, "r_y3": 433.53, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.21, "t": 433.59, "r": 417.19, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 441.66, "r_x1": 417.19, "r_y1": 441.66, "r_x2": 417.19, "r_y2": 433.59, "r_x3": 396.21, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.77, "t": 433.59, "r": 457.15, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 441.66, "r_x1": 457.15, "r_y1": 441.66, "r_x2": 457.15, "r_y2": 433.59, "r_x3": 440.77, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.91, "t": 452.42, "r": 166.51, "b": 460.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 460.49, "r_x1": 166.51, "r_y1": 460.49, "r_x2": 166.51, "r_y2": 452.42, "r_x3": 161.91, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.51, "t": 452.42, "r": 214.12, "b": 460.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 460.49, "r_x1": 214.12, "r_y1": 460.49, "r_x2": 214.12, "r_y2": 452.42, "r_x3": 209.51, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.71, "t": 446.94, "r": 271.41, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 455.01, "r_x1": 271.41, "r_y1": 455.01, "r_x2": 271.41, "r_y2": 446.94, "r_x3": 246.71, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.02, "t": 446.94, "r": 310.0, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 455.01, "r_x1": 310.0, "r_y1": 455.01, "r_x2": 310.0, "r_y2": 446.94, "r_x3": 289.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.02, "t": 446.94, "r": 345.4, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.02, "r_y0": 455.01, "r_x1": 345.4, "r_y1": 455.01, "r_x2": 345.4, "r_y2": 446.94, "r_x3": 329.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.09, "t": 446.88, "r": 386.25, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 454.8, "r_x1": 386.25, "r_y1": 454.8, "r_x2": 386.25, "r_y2": 446.88, "r_x3": 362.09, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.62, "t": 446.88, "r": 418.78, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 454.8, "r_x1": 418.78, "r_y1": 454.8, "r_x2": 418.78, "r_y2": 446.88, "r_x3": 394.62, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.53, "t": 446.88, "r": 458.38, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 454.8, "r_x1": 458.38, "r_y1": 454.8, "r_x2": 458.38, "r_y2": 446.88, "r_x3": 439.53, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.18, "t": 459.89, "r": 272.94, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 467.96, "r_x1": 272.94, "r_y1": 467.96, "r_x2": 272.94, "r_y2": 459.89, "r_x3": 245.18, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.02, "t": 459.89, "r": 310.0, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 467.96, "r_x1": 310.0, "r_y1": 467.96, "r_x2": 310.0, "r_y2": 459.89, "r_x3": 289.02, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.72, "t": 459.89, "r": 347.7, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 467.96, "r_x1": 347.7, "r_y1": 467.96, "r_x2": 347.7, "r_y2": 459.89, "r_x3": 326.72, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.68, "t": 459.89, "r": 384.66, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 467.96, "r_x1": 384.66, "r_y1": 467.96, "r_x2": 384.66, "r_y2": 459.89, "r_x3": 363.68, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.21, "t": 459.89, "r": 417.19, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 467.96, "r_x1": 417.19, "r_y1": 467.96, "r_x2": 417.19, "r_y2": 459.89, "r_x3": 396.21, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.65, "t": 459.89, "r": 451.26, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65, "r_y0": 467.96, "r_x1": 451.26, "r_y1": 467.96, "r_x2": 451.26, "r_y2": 459.89, "r_x3": 446.65, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 5, "label": "section_header", "bbox": { "l": 134.76, "t": 508.15, "r": 264.4, "b": 516.96, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 516.96, "r_x1": 149.4, "r_y1": 516.96, "r_x2": 149.4, "r_y2": 508.15, "r_x3": 134.76, "r_y3": 508.15, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 516.96, "r_x1": 264.4, "r_y1": 516.96, "r_x2": 264.4, "r_y2": 508.15, "r_x3": 160.86, "r_y3": 508.15, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 524.55, "r": 480.6, "b": 617.03, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.76, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.6, "r_y1": 557.26, "r_x2": 480.6, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.76, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.6, "r_y1": 593.12, "r_x2": 480.6, "r_y2": 584.33, "r_x3": 134.76, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 206.79, "r_y1": 617.03, "r_x2": 206.79, "r_y2": 608.24, "r_x3": 134.76, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 620.19, "r": 480.6, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 149.71, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.6, "r_y1": 640.94, "r_x2": 480.6, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 405.8, "r_y1": 664.85, "r_x2": 405.8, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "0": { "label": "table", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "table", "bbox": { "l": 139.67, "t": 337.57, "r": 475.0, "b": 469.47, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8, "r_x1": 168.05, "r_y1": 349.8, "r_x2": 168.05, "r_y2": 341.73, "r_x3": 160.37, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.59, "r_y0": 362.76, "r_x1": 183.83, "r_y1": 362.76, "r_x2": 183.83, "r_y2": 354.69, "r_x3": 144.59, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.97, "r_y0": 349.8, "r_x1": 215.65, "r_y1": 349.8, "r_x2": 215.65, "r_y2": 341.73, "r_x3": 207.97, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19, "r_y0": 362.76, "r_x1": 231.43, "r_y1": 362.76, "r_x2": 231.43, "r_y2": 354.69, "r_x3": 192.19, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.28, "r_x1": 278.32, "r_y1": 355.28, "r_x2": 278.32, "r_y2": 347.21, "r_x3": 239.8, "r_y3": 347.21, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67, "r_y0": 349.8, "r_x1": 348.26, "r_y1": 349.8, "r_x2": 348.26, "r_y2": 341.73, "r_x3": 324.67, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 349.8, "r_x1": 417.13, "r_y1": 349.8, "r_x2": 417.13, "r_y2": 341.73, "r_x3": 396.27, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.93, "r_y0": 360.76, "r_x1": 418.47, "r_y1": 360.76, "r_x2": 418.47, "r_y2": 352.69, "r_x3": 394.93, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.77, "r_y0": 349.8, "r_x1": 467.14, "r_y1": 349.8, "r_x2": 467.14, "r_y2": 341.73, "r_x3": 430.77, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.15, "r_y0": 360.76, "r_x1": 470.76, "r_y1": 360.76, "r_x2": 470.76, "r_y2": 352.69, "r_x3": 427.15, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.69, "r_y0": 362.76, "r_x1": 312.33, "r_y1": 362.76, "r_x2": 312.33, "r_y2": 354.69, "r_x3": 286.69, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.76, "r_x1": 353.72, "r_y1": 362.76, "r_x2": 353.72, "r_y2": 354.69, "r_x3": 320.7, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.31, "r_y0": 362.76, "r_x1": 379.03, "r_y1": 362.76, "r_x2": 379.03, "r_y2": 354.69, "r_x3": 369.31, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 381.59, "r_x1": 166.51, "r_y1": 381.59, "r_x2": 166.51, "r_y2": 373.52, "r_x3": 161.91, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 381.59, "r_x1": 214.12, "r_y1": 381.59, "r_x2": 214.12, "r_y2": 373.52, "r_x3": 209.51, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 376.11, "r_x1": 271.41, "r_y1": 376.11, "r_x2": 271.41, "r_y2": 368.04, "r_x3": 246.71, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 376.11, "r_x1": 310.0, "r_y1": 376.11, "r_x2": 310.0, "r_y2": 368.04, "r_x3": 289.02, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 376.11, "r_x1": 347.7, "r_y1": 376.11, "r_x2": 347.7, "r_y2": 368.04, "r_x3": 326.72, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 376.11, "r_x1": 384.66, "r_y1": 376.11, "r_x2": 384.66, "r_y2": 368.04, "r_x3": 363.68, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.27, "r_y0": 375.9, "r_x1": 416.13, "r_y1": 375.9, "r_x2": 416.13, "r_y2": 367.97, "r_x3": 397.27, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 375.9, "r_x1": 458.38, "r_y1": 375.9, "r_x2": 458.38, "r_y2": 367.97, "r_x3": 439.53, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 389.06, "r_x1": 272.94, "r_y1": 389.06, "r_x2": 272.94, "r_y2": 380.99, "r_x3": 245.18, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 389.06, "r_x1": 310.0, "r_y1": 389.06, "r_x2": 310.0, "r_y2": 380.99, "r_x3": 289.02, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 389.06, "r_x1": 347.7, "r_y1": 389.06, "r_x2": 347.7, "r_y2": 380.99, "r_x3": 326.72, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 389.06, "r_x1": 384.66, "r_y1": 389.06, "r_x2": 384.66, "r_y2": 380.99, "r_x3": 363.68, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 389.06, "r_x1": 417.19, "r_y1": 389.06, "r_x2": 417.19, "r_y2": 380.99, "r_x3": 396.21, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 389.06, "r_x1": 457.15, "r_y1": 389.06, "r_x2": 457.15, "r_y2": 380.99, "r_x3": 440.77, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 407.89, "r_x1": 166.51, "r_y1": 407.89, "r_x2": 166.51, "r_y2": 399.82, "r_x3": 161.91, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 407.89, "r_x1": 214.12, "r_y1": 407.89, "r_x2": 214.12, "r_y2": 399.82, "r_x3": 209.51, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 402.41, "r_x1": 271.41, "r_y1": 402.41, "r_x2": 271.41, "r_y2": 394.34, "r_x3": 246.71, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 402.41, "r_x1": 310.0, "r_y1": 402.41, "r_x2": 310.0, "r_y2": 394.34, "r_x3": 289.02, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 402.41, "r_x1": 347.7, "r_y1": 402.41, "r_x2": 347.7, "r_y2": 394.34, "r_x3": 326.72, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 402.41, "r_x1": 384.66, "r_y1": 402.41, "r_x2": 384.66, "r_y2": 394.34, "r_x3": 363.68, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 402.2, "r_x1": 418.78, "r_y1": 402.2, "r_x2": 418.78, "r_y2": 394.28, "r_x3": 394.62, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 402.2, "r_x1": 458.38, "r_y1": 402.2, "r_x2": 458.38, "r_y2": 394.28, "r_x3": 439.53, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 415.36, "r_x1": 272.94, "r_y1": 415.36, "r_x2": 272.94, "r_y2": 407.29, "r_x3": 245.18, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 415.36, "r_x1": 310.0, "r_y1": 415.36, "r_x2": 310.0, "r_y2": 407.29, "r_x3": 289.02, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 415.36, "r_x1": 347.7, "r_y1": 415.36, "r_x2": 347.7, "r_y2": 407.29, "r_x3": 326.72, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 415.15, "r_x1": 386.25, "r_y1": 415.15, "r_x2": 386.25, "r_y2": 407.23, "r_x3": 362.09, "r_y3": 407.23, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 415.36, "r_x1": 417.19, "r_y1": 415.36, "r_x2": 417.19, "r_y2": 407.29, "r_x3": 396.21, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 415.36, "r_x1": 457.15, "r_y1": 415.36, "r_x2": 457.15, "r_y2": 407.29, "r_x3": 440.77, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 434.19, "r_x1": 166.51, "r_y1": 434.19, "r_x2": 166.51, "r_y2": 426.12, "r_x3": 161.91, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 434.19, "r_x1": 214.12, "r_y1": 434.19, "r_x2": 214.12, "r_y2": 426.12, "r_x3": 209.51, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 428.71, "r_x1": 271.41, "r_y1": 428.71, "r_x2": 271.41, "r_y2": 420.64, "r_x3": 246.71, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 428.71, "r_x1": 310.0, "r_y1": 428.71, "r_x2": 310.0, "r_y2": 420.64, "r_x3": 289.02, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 428.71, "r_x1": 347.7, "r_y1": 428.71, "r_x2": 347.7, "r_y2": 420.64, "r_x3": 326.72, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 428.71, "r_x1": 384.66, "r_y1": 428.71, "r_x2": 384.66, "r_y2": 420.64, "r_x3": 363.68, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 428.5, "r_x1": 418.78, "r_y1": 428.5, "r_x2": 418.78, "r_y2": 420.58, "r_x3": 394.62, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 428.5, "r_x1": 458.38, "r_y1": 428.5, "r_x2": 458.38, "r_y2": 420.58, "r_x3": 439.53, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 441.66, "r_x1": 272.94, "r_y1": 441.66, "r_x2": 272.94, "r_y2": 433.59, "r_x3": 245.18, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 441.66, "r_x1": 310.0, "r_y1": 441.66, "r_x2": 310.0, "r_y2": 433.59, "r_x3": 289.02, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 441.66, "r_x1": 347.7, "r_y1": 441.66, "r_x2": 347.7, "r_y2": 433.59, "r_x3": 326.72, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 441.45, "r_x1": 386.25, "r_y1": 441.45, "r_x2": 386.25, "r_y2": 433.53, "r_x3": 362.09, "r_y3": 433.53, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 441.66, "r_x1": 417.19, "r_y1": 441.66, "r_x2": 417.19, "r_y2": 433.59, "r_x3": 396.21, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 441.66, "r_x1": 457.15, "r_y1": 441.66, "r_x2": 457.15, "r_y2": 433.59, "r_x3": 440.77, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 460.49, "r_x1": 166.51, "r_y1": 460.49, "r_x2": 166.51, "r_y2": 452.42, "r_x3": 161.91, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 460.49, "r_x1": 214.12, "r_y1": 460.49, "r_x2": 214.12, "r_y2": 452.42, "r_x3": 209.51, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 455.01, "r_x1": 271.41, "r_y1": 455.01, "r_x2": 271.41, "r_y2": 446.94, "r_x3": 246.71, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 455.01, "r_x1": 310.0, "r_y1": 455.01, "r_x2": 310.0, "r_y2": 446.94, "r_x3": 289.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.02, "r_y0": 455.01, "r_x1": 345.4, "r_y1": 455.01, "r_x2": 345.4, "r_y2": 446.94, "r_x3": 329.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 454.8, "r_x1": 386.25, "r_y1": 454.8, "r_x2": 386.25, "r_y2": 446.88, "r_x3": 362.09, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 454.8, "r_x1": 418.78, "r_y1": 454.8, "r_x2": 418.78, "r_y2": 446.88, "r_x3": 394.62, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 454.8, "r_x1": 458.38, "r_y1": 454.8, "r_x2": 458.38, "r_y2": 446.88, "r_x3": 439.53, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 467.96, "r_x1": 272.94, "r_y1": 467.96, "r_x2": 272.94, "r_y2": 459.89, "r_x3": 245.18, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 467.96, "r_x1": 310.0, "r_y1": 467.96, "r_x2": 310.0, "r_y2": 459.89, "r_x3": 289.02, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 467.96, "r_x1": 347.7, "r_y1": 467.96, "r_x2": 347.7, "r_y2": 459.89, "r_x3": 326.72, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 467.96, "r_x1": 384.66, "r_y1": 467.96, "r_x2": 384.66, "r_y2": 459.89, "r_x3": 363.68, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 467.96, "r_x1": 417.19, "r_y1": 467.96, "r_x2": 417.19, "r_y2": 459.89, "r_x3": 396.21, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65, "r_y0": 467.96, "r_x1": 451.26, "r_y1": 467.96, "r_x2": 451.26, "r_y2": 459.89, "r_x3": 446.65, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.37, "t": 341.73, "r": 168.05, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8, "r_x1": 168.05, "r_y1": 349.8, "r_x2": 168.05, "r_y2": 341.73, "r_x3": 160.37, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.59, "t": 354.69, "r": 183.83, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.59, "r_y0": 362.76, "r_x1": 183.83, "r_y1": 362.76, "r_x2": 183.83, "r_y2": 354.69, "r_x3": 144.59, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 207.97, "t": 341.73, "r": 215.65, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.97, "r_y0": 349.8, "r_x1": 215.65, "r_y1": 349.8, "r_x2": 215.65, "r_y2": 341.73, "r_x3": 207.97, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.19, "t": 354.69, "r": 231.43, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19, "r_y0": 362.76, "r_x1": 231.43, "r_y1": 362.76, "r_x2": 231.43, "r_y2": 354.69, "r_x3": 192.19, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.8, "t": 347.21, "r": 278.32, "b": 355.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.28, "r_x1": 278.32, "r_y1": 355.28, "r_x2": 278.32, "r_y2": 347.21, "r_x3": 239.8, "r_y3": 347.21, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.67, "t": 341.73, "r": 348.26, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67, "r_y0": 349.8, "r_x1": 348.26, "r_y1": 349.8, "r_x2": 348.26, "r_y2": 341.73, "r_x3": 324.67, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.27, "t": 341.73, "r": 417.13, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 349.8, "r_x1": 417.13, "r_y1": 349.8, "r_x2": 417.13, "r_y2": 341.73, "r_x3": 396.27, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.93, "t": 352.69, "r": 418.47, "b": 360.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.93, "r_y0": 360.76, "r_x1": 418.47, "r_y1": 360.76, "r_x2": 418.47, "r_y2": 352.69, "r_x3": 394.93, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.77, "t": 341.73, "r": 467.14, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.77, "r_y0": 349.8, "r_x1": 467.14, "r_y1": 349.8, "r_x2": 467.14, "r_y2": 341.73, "r_x3": 430.77, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.15, "t": 352.69, "r": 470.76, "b": 360.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.15, "r_y0": 360.76, "r_x1": 470.76, "r_y1": 360.76, "r_x2": 470.76, "r_y2": 352.69, "r_x3": 427.15, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.69, "t": 354.69, "r": 312.33, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.69, "r_y0": 362.76, "r_x1": 312.33, "r_y1": 362.76, "r_x2": 312.33, "r_y2": 354.69, "r_x3": 286.69, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.7, "t": 354.69, "r": 353.72, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.76, "r_x1": 353.72, "r_y1": 362.76, "r_x2": 353.72, "r_y2": 354.69, "r_x3": 320.7, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.31, "t": 354.69, "r": 379.03, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.31, "r_y0": 362.76, "r_x1": 379.03, "r_y1": 362.76, "r_x2": 379.03, "r_y2": 354.69, "r_x3": 369.31, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.91, "t": 373.52, "r": 166.51, "b": 381.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 381.59, "r_x1": 166.51, "r_y1": 381.59, "r_x2": 166.51, "r_y2": 373.52, "r_x3": 161.91, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.51, "t": 373.52, "r": 214.12, "b": 381.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 381.59, "r_x1": 214.12, "r_y1": 381.59, "r_x2": 214.12, "r_y2": 373.52, "r_x3": 209.51, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.71, "t": 368.04, "r": 271.41, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 376.11, "r_x1": 271.41, "r_y1": 376.11, "r_x2": 271.41, "r_y2": 368.04, "r_x3": 246.71, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.02, "t": 368.04, "r": 310.0, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 376.11, "r_x1": 310.0, "r_y1": 376.11, "r_x2": 310.0, "r_y2": 368.04, "r_x3": 289.02, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.72, "t": 368.04, "r": 347.7, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 376.11, "r_x1": 347.7, "r_y1": 376.11, "r_x2": 347.7, "r_y2": 368.04, "r_x3": 326.72, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.68, "t": 368.04, "r": 384.66, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 376.11, "r_x1": 384.66, "r_y1": 376.11, "r_x2": 384.66, "r_y2": 368.04, "r_x3": 363.68, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.27, "t": 367.97, "r": 416.13, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.27, "r_y0": 375.9, "r_x1": 416.13, "r_y1": 375.9, "r_x2": 416.13, "r_y2": 367.97, "r_x3": 397.27, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.53, "t": 367.97, "r": 458.38, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 375.9, "r_x1": 458.38, "r_y1": 375.9, "r_x2": 458.38, "r_y2": 367.97, "r_x3": 439.53, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.18, "t": 380.99, "r": 272.94, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 389.06, "r_x1": 272.94, "r_y1": 389.06, "r_x2": 272.94, "r_y2": 380.99, "r_x3": 245.18, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.02, "t": 380.99, "r": 310.0, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 389.06, "r_x1": 310.0, "r_y1": 389.06, "r_x2": 310.0, "r_y2": 380.99, "r_x3": 289.02, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.72, "t": 380.99, "r": 347.7, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 389.06, "r_x1": 347.7, "r_y1": 389.06, "r_x2": 347.7, "r_y2": 380.99, "r_x3": 326.72, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.68, "t": 380.99, "r": 384.66, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 389.06, "r_x1": 384.66, "r_y1": 389.06, "r_x2": 384.66, "r_y2": 380.99, "r_x3": 363.68, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.21, "t": 380.99, "r": 417.19, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 389.06, "r_x1": 417.19, "r_y1": 389.06, "r_x2": 417.19, "r_y2": 380.99, "r_x3": 396.21, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.77, "t": 380.99, "r": 457.15, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 389.06, "r_x1": 457.15, "r_y1": 389.06, "r_x2": 457.15, "r_y2": 380.99, "r_x3": 440.77, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.91, "t": 399.82, "r": 166.51, "b": 407.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 407.89, "r_x1": 166.51, "r_y1": 407.89, "r_x2": 166.51, "r_y2": 399.82, "r_x3": 161.91, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.51, "t": 399.82, "r": 214.12, "b": 407.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 407.89, "r_x1": 214.12, "r_y1": 407.89, "r_x2": 214.12, "r_y2": 399.82, "r_x3": 209.51, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.71, "t": 394.34, "r": 271.41, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 402.41, "r_x1": 271.41, "r_y1": 402.41, "r_x2": 271.41, "r_y2": 394.34, "r_x3": 246.71, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.02, "t": 394.34, "r": 310.0, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 402.41, "r_x1": 310.0, "r_y1": 402.41, "r_x2": 310.0, "r_y2": 394.34, "r_x3": 289.02, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.72, "t": 394.34, "r": 347.7, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 402.41, "r_x1": 347.7, "r_y1": 402.41, "r_x2": 347.7, "r_y2": 394.34, "r_x3": 326.72, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.68, "t": 394.34, "r": 384.66, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 402.41, "r_x1": 384.66, "r_y1": 402.41, "r_x2": 384.66, "r_y2": 394.34, "r_x3": 363.68, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.62, "t": 394.28, "r": 418.78, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 402.2, "r_x1": 418.78, "r_y1": 402.2, "r_x2": 418.78, "r_y2": 394.28, "r_x3": 394.62, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.53, "t": 394.28, "r": 458.38, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 402.2, "r_x1": 458.38, "r_y1": 402.2, "r_x2": 458.38, "r_y2": 394.28, "r_x3": 439.53, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.18, "t": 407.29, "r": 272.94, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 415.36, "r_x1": 272.94, "r_y1": 415.36, "r_x2": 272.94, "r_y2": 407.29, "r_x3": 245.18, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.02, "t": 407.29, "r": 310.0, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 415.36, "r_x1": 310.0, "r_y1": 415.36, "r_x2": 310.0, "r_y2": 407.29, "r_x3": 289.02, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.72, "t": 407.29, "r": 347.7, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 415.36, "r_x1": 347.7, "r_y1": 415.36, "r_x2": 347.7, "r_y2": 407.29, "r_x3": 326.72, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.09, "t": 407.23, "r": 386.25, "b": 415.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 415.15, "r_x1": 386.25, "r_y1": 415.15, "r_x2": 386.25, "r_y2": 407.23, "r_x3": 362.09, "r_y3": 407.23, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.21, "t": 407.29, "r": 417.19, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 415.36, "r_x1": 417.19, "r_y1": 415.36, "r_x2": 417.19, "r_y2": 407.29, "r_x3": 396.21, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.77, "t": 407.29, "r": 457.15, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 415.36, "r_x1": 457.15, "r_y1": 415.36, "r_x2": 457.15, "r_y2": 407.29, "r_x3": 440.77, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.91, "t": 426.12, "r": 166.51, "b": 434.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 434.19, "r_x1": 166.51, "r_y1": 434.19, "r_x2": 166.51, "r_y2": 426.12, "r_x3": 161.91, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.51, "t": 426.12, "r": 214.12, "b": 434.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 434.19, "r_x1": 214.12, "r_y1": 434.19, "r_x2": 214.12, "r_y2": 426.12, "r_x3": 209.51, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.71, "t": 420.64, "r": 271.41, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 428.71, "r_x1": 271.41, "r_y1": 428.71, "r_x2": 271.41, "r_y2": 420.64, "r_x3": 246.71, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.02, "t": 420.64, "r": 310.0, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 428.71, "r_x1": 310.0, "r_y1": 428.71, "r_x2": 310.0, "r_y2": 420.64, "r_x3": 289.02, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.72, "t": 420.64, "r": 347.7, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 428.71, "r_x1": 347.7, "r_y1": 428.71, "r_x2": 347.7, "r_y2": 420.64, "r_x3": 326.72, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.68, "t": 420.64, "r": 384.66, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 428.71, "r_x1": 384.66, "r_y1": 428.71, "r_x2": 384.66, "r_y2": 420.64, "r_x3": 363.68, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.62, "t": 420.58, "r": 418.78, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 428.5, "r_x1": 418.78, "r_y1": 428.5, "r_x2": 418.78, "r_y2": 420.58, "r_x3": 394.62, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.53, "t": 420.58, "r": 458.38, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 428.5, "r_x1": 458.38, "r_y1": 428.5, "r_x2": 458.38, "r_y2": 420.58, "r_x3": 439.53, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.18, "t": 433.59, "r": 272.94, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 441.66, "r_x1": 272.94, "r_y1": 441.66, "r_x2": 272.94, "r_y2": 433.59, "r_x3": 245.18, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.02, "t": 433.59, "r": 310.0, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 441.66, "r_x1": 310.0, "r_y1": 441.66, "r_x2": 310.0, "r_y2": 433.59, "r_x3": 289.02, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.72, "t": 433.59, "r": 347.7, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 441.66, "r_x1": 347.7, "r_y1": 441.66, "r_x2": 347.7, "r_y2": 433.59, "r_x3": 326.72, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.09, "t": 433.53, "r": 386.25, "b": 441.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 441.45, "r_x1": 386.25, "r_y1": 441.45, "r_x2": 386.25, "r_y2": 433.53, "r_x3": 362.09, "r_y3": 433.53, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.21, "t": 433.59, "r": 417.19, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 441.66, "r_x1": 417.19, "r_y1": 441.66, "r_x2": 417.19, "r_y2": 433.59, "r_x3": 396.21, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.77, "t": 433.59, "r": 457.15, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 441.66, "r_x1": 457.15, "r_y1": 441.66, "r_x2": 457.15, "r_y2": 433.59, "r_x3": 440.77, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.91, "t": 452.42, "r": 166.51, "b": 460.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 460.49, "r_x1": 166.51, "r_y1": 460.49, "r_x2": 166.51, "r_y2": 452.42, "r_x3": 161.91, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.51, "t": 452.42, "r": 214.12, "b": 460.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 460.49, "r_x1": 214.12, "r_y1": 460.49, "r_x2": 214.12, "r_y2": 452.42, "r_x3": 209.51, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.71, "t": 446.94, "r": 271.41, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 455.01, "r_x1": 271.41, "r_y1": 455.01, "r_x2": 271.41, "r_y2": 446.94, "r_x3": 246.71, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.02, "t": 446.94, "r": 310.0, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 455.01, "r_x1": 310.0, "r_y1": 455.01, "r_x2": 310.0, "r_y2": 446.94, "r_x3": 289.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.02, "t": 446.94, "r": 345.4, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.02, "r_y0": 455.01, "r_x1": 345.4, "r_y1": 455.01, "r_x2": 345.4, "r_y2": 446.94, "r_x3": 329.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.09, "t": 446.88, "r": 386.25, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 454.8, "r_x1": 386.25, "r_y1": 454.8, "r_x2": 386.25, "r_y2": 446.88, "r_x3": 362.09, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.62, "t": 446.88, "r": 418.78, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 454.8, "r_x1": 418.78, "r_y1": 454.8, "r_x2": 418.78, "r_y2": 446.88, "r_x3": 394.62, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.53, "t": 446.88, "r": 458.38, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 454.8, "r_x1": 458.38, "r_y1": 454.8, "r_x2": 458.38, "r_y2": 446.88, "r_x3": 439.53, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.18, "t": 459.89, "r": 272.94, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 467.96, "r_x1": 272.94, "r_y1": 467.96, "r_x2": 272.94, "r_y2": 459.89, "r_x3": 245.18, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.02, "t": 459.89, "r": 310.0, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 467.96, "r_x1": 310.0, "r_y1": 467.96, "r_x2": 310.0, "r_y2": 459.89, "r_x3": 289.02, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.72, "t": 459.89, "r": 347.7, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 467.96, "r_x1": 347.7, "r_y1": 467.96, "r_x2": 347.7, "r_y2": 459.89, "r_x3": 326.72, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.68, "t": 459.89, "r": 384.66, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 467.96, "r_x1": 384.66, "r_y1": 467.96, "r_x2": 384.66, "r_y2": 459.89, "r_x3": 363.68, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.21, "t": 459.89, "r": 417.19, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 467.96, "r_x1": 417.19, "r_y1": 467.96, "r_x2": 417.19, "r_y2": 459.89, "r_x3": 396.21, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.65, "t": 459.89, "r": 451.26, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65, "r_y0": 467.96, "r_x1": 451.26, "r_y1": 467.96, "r_x2": 451.26, "r_y2": 459.89, "r_x3": 446.65, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 6, "num_cols": 8, "table_cells": [ { "bbox": { "l": 160.37, "t": 341.73, "r": 168.05, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 207.97, "t": 341.73, "r": 215.65, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 239.8, "t": 347.21, "r": 278.32, "b": 355.28, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 324.67, "t": 341.73, "r": 348.26, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 396.27, "t": 341.73, "r": 417.13, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 394.93, "t": 352.69, "r": 418.47, "b": 360.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 430.77, "t": 341.73, "r": 467.14, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.15, "t": 352.69, "r": 470.76, "b": 360.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 286.69, "t": 354.69, "r": 312.33, "b": 362.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 320.7, "t": 354.69, "r": 353.72, "b": 362.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 369.31, "t": 354.69, "r": 379.03, "b": 362.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 373.52, "r": 166.51, "b": 381.59, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 373.52, "r": 214.12, "b": 381.59, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 368.04, "r": 271.41, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 368.04, "r": 310.0, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.72, "t": 368.04, "r": 347.7, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.68, "t": 368.04, "r": 384.66, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 397.27, "t": 367.97, "r": 416.13, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 367.97, "r": 458.38, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 399.82, "r": 166.51, "b": 407.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 399.82, "r": 214.12, "b": 407.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 394.34, "r": 271.41, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 394.34, "r": 310.0, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.72, "t": 394.34, "r": 347.7, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.68, "t": 394.34, "r": 384.66, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.62, "t": 394.28, "r": 418.78, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 394.28, "r": 458.38, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 426.12, "r": 166.51, "b": 434.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 426.12, "r": 214.12, "b": 434.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 420.64, "r": 271.41, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 420.64, "r": 310.0, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.72, "t": 420.64, "r": 347.7, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.68, "t": 420.64, "r": 384.66, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.62, "t": 420.58, "r": 418.78, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 420.58, "r": 458.38, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 452.42, "r": 166.51, "b": 460.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 452.42, "r": 214.12, "b": 460.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 446.94, "r": 271.41, "b": 455.01, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 446.94, "r": 310.0, "b": 455.01, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 329.02, "t": 446.94, "r": 345.4, "b": 455.01, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 362.09, "t": 446.88, "r": 386.25, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.62, "t": 446.88, "r": 418.78, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 446.88, "r": 458.38, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.937, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.886, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" }, { "label": "text", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.6, "b": 151.64, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.6, "r_y1": 139.69, "r_x2": 480.6, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 210.78, "r_y1": 151.64, "r_x2": 210.78, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz." }, { "label": "section_header", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "section_header", "bbox": { "l": 134.76, "t": 169.19, "r": 318.45, "b": 177.99, "coord_origin": "TOPLEFT" }, "confidence": 0.958, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 177.99, "r_x1": 149.4, "r_y1": 177.99, "r_x2": 149.4, "r_y2": 169.19, "r_x3": 134.76, "r_y3": 169.19, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 177.99, "r_x1": 318.45, "r_y1": 177.99, "r_x2": 318.45, "r_y2": 169.19, "r_x3": 160.86, "r_y3": 169.19, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1 Hyper Parameter Optimization" }, { "label": "text", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76, "t": 185.59, "r": 480.59, "b": 254.16, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 194.38, "r_x1": 480.59, "r_y1": 194.38, "r_x2": 480.59, "r_y2": 185.59, "r_x3": 134.76, "r_y3": 185.59, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 206.34, "r_x1": 480.59, "r_y1": 206.34, "r_x2": 480.59, "r_y2": 197.54, "r_x3": 134.76, "r_y3": 197.54, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 218.29, "r_x1": 480.59, "r_y1": 218.29, "r_x2": 480.59, "r_y2": 209.5, "r_x3": 134.76, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 230.25, "r_x1": 480.59, "r_y1": 230.25, "r_x2": 480.59, "r_y2": 221.45, "r_x3": 134.76, "r_y3": 221.45, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 242.2, "r_x1": 440.94, "r_y1": 242.2, "r_x2": 440.94, "r_y2": 233.41, "r_x3": 134.76, "r_y3": 233.41, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.87, "r_y0": 242.2, "r_x1": 480.59, "r_y1": 242.2, "r_x2": 480.59, "r_y2": 233.41, "r_x3": 444.87, "r_y3": 233.41, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 254.16, "r_x1": 145.2, "r_y1": 254.16, "r_x2": 145.2, "r_y2": 245.36, "r_x3": 134.76, "r_y3": 245.36, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.15, "r_y0": 254.16, "r_x1": 311.22, "r_y1": 254.16, "r_x2": 311.22, "r_y2": 245.36, "r_x3": 149.15, "r_y3": 245.36, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML." }, { "label": "caption", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.76, "t": 275.07, "r": 480.6, "b": 327.04, "coord_origin": "TOPLEFT" }, "confidence": 0.957, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.0, "r_x1": 160.12, "r_y1": 283.0, "r_x2": 160.12, "r_y2": 275.07, "r_x3": 134.76, "r_y3": 275.07, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.35, "r_y0": 283.0, "r_x1": 175.6, "r_y1": 283.0, "r_x2": 175.6, "r_y2": 275.07, "r_x3": 167.35, "r_y3": 275.07, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.13, "r_y0": 283.2, "r_x1": 480.59, "r_y1": 283.2, "r_x2": 480.59, "r_y2": 275.14, "r_x3": 188.13, "r_y3": 275.14, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 294.16, "r_x1": 480.59, "r_y1": 294.16, "r_x2": 480.59, "r_y2": 286.09, "r_x3": 134.76, "r_y3": 286.09, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 305.12, "r_x1": 480.6, "r_y1": 305.12, "r_x2": 480.6, "r_y2": 297.05, "r_x3": 134.76, "r_y3": 297.05, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 316.08, "r_x1": 480.59, "r_y1": 316.08, "r_x2": 480.59, "r_y2": 308.01, "r_x3": 134.76, "r_y3": 308.01, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 327.04, "r_x1": 480.59, "r_y1": 327.04, "r_x2": 480.59, "r_y2": 318.97, "r_x3": 134.76, "r_y3": 318.97, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart." }, { "label": "table", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "table", "bbox": { "l": 139.67, "t": 337.57, "r": 475.0, "b": 469.47, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8, "r_x1": 168.05, "r_y1": 349.8, "r_x2": 168.05, "r_y2": 341.73, "r_x3": 160.37, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.59, "r_y0": 362.76, "r_x1": 183.83, "r_y1": 362.76, "r_x2": 183.83, "r_y2": 354.69, "r_x3": 144.59, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.97, "r_y0": 349.8, "r_x1": 215.65, "r_y1": 349.8, "r_x2": 215.65, "r_y2": 341.73, "r_x3": 207.97, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19, "r_y0": 362.76, "r_x1": 231.43, "r_y1": 362.76, "r_x2": 231.43, "r_y2": 354.69, "r_x3": 192.19, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.28, "r_x1": 278.32, "r_y1": 355.28, "r_x2": 278.32, "r_y2": 347.21, "r_x3": 239.8, "r_y3": 347.21, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67, "r_y0": 349.8, "r_x1": 348.26, "r_y1": 349.8, "r_x2": 348.26, "r_y2": 341.73, "r_x3": 324.67, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 349.8, "r_x1": 417.13, "r_y1": 349.8, "r_x2": 417.13, "r_y2": 341.73, "r_x3": 396.27, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.93, "r_y0": 360.76, "r_x1": 418.47, "r_y1": 360.76, "r_x2": 418.47, "r_y2": 352.69, "r_x3": 394.93, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.77, "r_y0": 349.8, "r_x1": 467.14, "r_y1": 349.8, "r_x2": 467.14, "r_y2": 341.73, "r_x3": 430.77, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.15, "r_y0": 360.76, "r_x1": 470.76, "r_y1": 360.76, "r_x2": 470.76, "r_y2": 352.69, "r_x3": 427.15, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.69, "r_y0": 362.76, "r_x1": 312.33, "r_y1": 362.76, "r_x2": 312.33, "r_y2": 354.69, "r_x3": 286.69, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.76, "r_x1": 353.72, "r_y1": 362.76, "r_x2": 353.72, "r_y2": 354.69, "r_x3": 320.7, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.31, "r_y0": 362.76, "r_x1": 379.03, "r_y1": 362.76, "r_x2": 379.03, "r_y2": 354.69, "r_x3": 369.31, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 381.59, "r_x1": 166.51, "r_y1": 381.59, "r_x2": 166.51, "r_y2": 373.52, "r_x3": 161.91, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 381.59, "r_x1": 214.12, "r_y1": 381.59, "r_x2": 214.12, "r_y2": 373.52, "r_x3": 209.51, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 376.11, "r_x1": 271.41, "r_y1": 376.11, "r_x2": 271.41, "r_y2": 368.04, "r_x3": 246.71, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 376.11, "r_x1": 310.0, "r_y1": 376.11, "r_x2": 310.0, "r_y2": 368.04, "r_x3": 289.02, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 376.11, "r_x1": 347.7, "r_y1": 376.11, "r_x2": 347.7, "r_y2": 368.04, "r_x3": 326.72, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 376.11, "r_x1": 384.66, "r_y1": 376.11, "r_x2": 384.66, "r_y2": 368.04, "r_x3": 363.68, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.27, "r_y0": 375.9, "r_x1": 416.13, "r_y1": 375.9, "r_x2": 416.13, "r_y2": 367.97, "r_x3": 397.27, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 375.9, "r_x1": 458.38, "r_y1": 375.9, "r_x2": 458.38, "r_y2": 367.97, "r_x3": 439.53, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 389.06, "r_x1": 272.94, "r_y1": 389.06, "r_x2": 272.94, "r_y2": 380.99, "r_x3": 245.18, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 389.06, "r_x1": 310.0, "r_y1": 389.06, "r_x2": 310.0, "r_y2": 380.99, "r_x3": 289.02, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 389.06, "r_x1": 347.7, "r_y1": 389.06, "r_x2": 347.7, "r_y2": 380.99, "r_x3": 326.72, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 389.06, "r_x1": 384.66, "r_y1": 389.06, "r_x2": 384.66, "r_y2": 380.99, "r_x3": 363.68, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 389.06, "r_x1": 417.19, "r_y1": 389.06, "r_x2": 417.19, "r_y2": 380.99, "r_x3": 396.21, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 389.06, "r_x1": 457.15, "r_y1": 389.06, "r_x2": 457.15, "r_y2": 380.99, "r_x3": 440.77, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 407.89, "r_x1": 166.51, "r_y1": 407.89, "r_x2": 166.51, "r_y2": 399.82, "r_x3": 161.91, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 407.89, "r_x1": 214.12, "r_y1": 407.89, "r_x2": 214.12, "r_y2": 399.82, "r_x3": 209.51, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 402.41, "r_x1": 271.41, "r_y1": 402.41, "r_x2": 271.41, "r_y2": 394.34, "r_x3": 246.71, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 402.41, "r_x1": 310.0, "r_y1": 402.41, "r_x2": 310.0, "r_y2": 394.34, "r_x3": 289.02, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 402.41, "r_x1": 347.7, "r_y1": 402.41, "r_x2": 347.7, "r_y2": 394.34, "r_x3": 326.72, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 402.41, "r_x1": 384.66, "r_y1": 402.41, "r_x2": 384.66, "r_y2": 394.34, "r_x3": 363.68, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 402.2, "r_x1": 418.78, "r_y1": 402.2, "r_x2": 418.78, "r_y2": 394.28, "r_x3": 394.62, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 402.2, "r_x1": 458.38, "r_y1": 402.2, "r_x2": 458.38, "r_y2": 394.28, "r_x3": 439.53, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 415.36, "r_x1": 272.94, "r_y1": 415.36, "r_x2": 272.94, "r_y2": 407.29, "r_x3": 245.18, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 415.36, "r_x1": 310.0, "r_y1": 415.36, "r_x2": 310.0, "r_y2": 407.29, "r_x3": 289.02, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 415.36, "r_x1": 347.7, "r_y1": 415.36, "r_x2": 347.7, "r_y2": 407.29, "r_x3": 326.72, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 415.15, "r_x1": 386.25, "r_y1": 415.15, "r_x2": 386.25, "r_y2": 407.23, "r_x3": 362.09, "r_y3": 407.23, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 415.36, "r_x1": 417.19, "r_y1": 415.36, "r_x2": 417.19, "r_y2": 407.29, "r_x3": 396.21, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 415.36, "r_x1": 457.15, "r_y1": 415.36, "r_x2": 457.15, "r_y2": 407.29, "r_x3": 440.77, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 434.19, "r_x1": 166.51, "r_y1": 434.19, "r_x2": 166.51, "r_y2": 426.12, "r_x3": 161.91, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 434.19, "r_x1": 214.12, "r_y1": 434.19, "r_x2": 214.12, "r_y2": 426.12, "r_x3": 209.51, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 428.71, "r_x1": 271.41, "r_y1": 428.71, "r_x2": 271.41, "r_y2": 420.64, "r_x3": 246.71, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 428.71, "r_x1": 310.0, "r_y1": 428.71, "r_x2": 310.0, "r_y2": 420.64, "r_x3": 289.02, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 428.71, "r_x1": 347.7, "r_y1": 428.71, "r_x2": 347.7, "r_y2": 420.64, "r_x3": 326.72, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 428.71, "r_x1": 384.66, "r_y1": 428.71, "r_x2": 384.66, "r_y2": 420.64, "r_x3": 363.68, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 428.5, "r_x1": 418.78, "r_y1": 428.5, "r_x2": 418.78, "r_y2": 420.58, "r_x3": 394.62, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 428.5, "r_x1": 458.38, "r_y1": 428.5, "r_x2": 458.38, "r_y2": 420.58, "r_x3": 439.53, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 441.66, "r_x1": 272.94, "r_y1": 441.66, "r_x2": 272.94, "r_y2": 433.59, "r_x3": 245.18, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 441.66, "r_x1": 310.0, "r_y1": 441.66, "r_x2": 310.0, "r_y2": 433.59, "r_x3": 289.02, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 441.66, "r_x1": 347.7, "r_y1": 441.66, "r_x2": 347.7, "r_y2": 433.59, "r_x3": 326.72, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 441.45, "r_x1": 386.25, "r_y1": 441.45, "r_x2": 386.25, "r_y2": 433.53, "r_x3": 362.09, "r_y3": 433.53, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 441.66, "r_x1": 417.19, "r_y1": 441.66, "r_x2": 417.19, "r_y2": 433.59, "r_x3": 396.21, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 441.66, "r_x1": 457.15, "r_y1": 441.66, "r_x2": 457.15, "r_y2": 433.59, "r_x3": 440.77, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 460.49, "r_x1": 166.51, "r_y1": 460.49, "r_x2": 166.51, "r_y2": 452.42, "r_x3": 161.91, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 460.49, "r_x1": 214.12, "r_y1": 460.49, "r_x2": 214.12, "r_y2": 452.42, "r_x3": 209.51, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 455.01, "r_x1": 271.41, "r_y1": 455.01, "r_x2": 271.41, "r_y2": 446.94, "r_x3": 246.71, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 455.01, "r_x1": 310.0, "r_y1": 455.01, "r_x2": 310.0, "r_y2": 446.94, "r_x3": 289.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.02, "r_y0": 455.01, "r_x1": 345.4, "r_y1": 455.01, "r_x2": 345.4, "r_y2": 446.94, "r_x3": 329.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 454.8, "r_x1": 386.25, "r_y1": 454.8, "r_x2": 386.25, "r_y2": 446.88, "r_x3": 362.09, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 454.8, "r_x1": 418.78, "r_y1": 454.8, "r_x2": 418.78, "r_y2": 446.88, "r_x3": 394.62, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 454.8, "r_x1": 458.38, "r_y1": 454.8, "r_x2": 458.38, "r_y2": 446.88, "r_x3": 439.53, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 467.96, "r_x1": 272.94, "r_y1": 467.96, "r_x2": 272.94, "r_y2": 459.89, "r_x3": 245.18, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 467.96, "r_x1": 310.0, "r_y1": 467.96, "r_x2": 310.0, "r_y2": 459.89, "r_x3": 289.02, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 467.96, "r_x1": 347.7, "r_y1": 467.96, "r_x2": 347.7, "r_y2": 459.89, "r_x3": 326.72, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 467.96, "r_x1": 384.66, "r_y1": 467.96, "r_x2": 384.66, "r_y2": 459.89, "r_x3": 363.68, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 467.96, "r_x1": 417.19, "r_y1": 467.96, "r_x2": 417.19, "r_y2": 459.89, "r_x3": 396.21, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65, "r_y0": 467.96, "r_x1": 451.26, "r_y1": 467.96, "r_x2": 451.26, "r_y2": 459.89, "r_x3": 446.65, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.37, "t": 341.73, "r": 168.05, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8, "r_x1": 168.05, "r_y1": 349.8, "r_x2": 168.05, "r_y2": 341.73, "r_x3": 160.37, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.59, "t": 354.69, "r": 183.83, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.59, "r_y0": 362.76, "r_x1": 183.83, "r_y1": 362.76, "r_x2": 183.83, "r_y2": 354.69, "r_x3": 144.59, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 207.97, "t": 341.73, "r": 215.65, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.97, "r_y0": 349.8, "r_x1": 215.65, "r_y1": 349.8, "r_x2": 215.65, "r_y2": 341.73, "r_x3": 207.97, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.19, "t": 354.69, "r": 231.43, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19, "r_y0": 362.76, "r_x1": 231.43, "r_y1": 362.76, "r_x2": 231.43, "r_y2": 354.69, "r_x3": 192.19, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.8, "t": 347.21, "r": 278.32, "b": 355.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.28, "r_x1": 278.32, "r_y1": 355.28, "r_x2": 278.32, "r_y2": 347.21, "r_x3": 239.8, "r_y3": 347.21, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.67, "t": 341.73, "r": 348.26, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67, "r_y0": 349.8, "r_x1": 348.26, "r_y1": 349.8, "r_x2": 348.26, "r_y2": 341.73, "r_x3": 324.67, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.27, "t": 341.73, "r": 417.13, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 349.8, "r_x1": 417.13, "r_y1": 349.8, "r_x2": 417.13, "r_y2": 341.73, "r_x3": 396.27, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.93, "t": 352.69, "r": 418.47, "b": 360.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.93, "r_y0": 360.76, "r_x1": 418.47, "r_y1": 360.76, "r_x2": 418.47, "r_y2": 352.69, "r_x3": 394.93, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.77, "t": 341.73, "r": 467.14, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.77, "r_y0": 349.8, "r_x1": 467.14, "r_y1": 349.8, "r_x2": 467.14, "r_y2": 341.73, "r_x3": 430.77, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.15, "t": 352.69, "r": 470.76, "b": 360.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.15, "r_y0": 360.76, "r_x1": 470.76, "r_y1": 360.76, "r_x2": 470.76, "r_y2": 352.69, "r_x3": 427.15, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.69, "t": 354.69, "r": 312.33, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.69, "r_y0": 362.76, "r_x1": 312.33, "r_y1": 362.76, "r_x2": 312.33, "r_y2": 354.69, "r_x3": 286.69, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.7, "t": 354.69, "r": 353.72, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.76, "r_x1": 353.72, "r_y1": 362.76, "r_x2": 353.72, "r_y2": 354.69, "r_x3": 320.7, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.31, "t": 354.69, "r": 379.03, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.31, "r_y0": 362.76, "r_x1": 379.03, "r_y1": 362.76, "r_x2": 379.03, "r_y2": 354.69, "r_x3": 369.31, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.91, "t": 373.52, "r": 166.51, "b": 381.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 381.59, "r_x1": 166.51, "r_y1": 381.59, "r_x2": 166.51, "r_y2": 373.52, "r_x3": 161.91, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.51, "t": 373.52, "r": 214.12, "b": 381.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 381.59, "r_x1": 214.12, "r_y1": 381.59, "r_x2": 214.12, "r_y2": 373.52, "r_x3": 209.51, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.71, "t": 368.04, "r": 271.41, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 376.11, "r_x1": 271.41, "r_y1": 376.11, "r_x2": 271.41, "r_y2": 368.04, "r_x3": 246.71, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.02, "t": 368.04, "r": 310.0, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 376.11, "r_x1": 310.0, "r_y1": 376.11, "r_x2": 310.0, "r_y2": 368.04, "r_x3": 289.02, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.72, "t": 368.04, "r": 347.7, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 376.11, "r_x1": 347.7, "r_y1": 376.11, "r_x2": 347.7, "r_y2": 368.04, "r_x3": 326.72, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.68, "t": 368.04, "r": 384.66, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 376.11, "r_x1": 384.66, "r_y1": 376.11, "r_x2": 384.66, "r_y2": 368.04, "r_x3": 363.68, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.27, "t": 367.97, "r": 416.13, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.27, "r_y0": 375.9, "r_x1": 416.13, "r_y1": 375.9, "r_x2": 416.13, "r_y2": 367.97, "r_x3": 397.27, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.53, "t": 367.97, "r": 458.38, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 375.9, "r_x1": 458.38, "r_y1": 375.9, "r_x2": 458.38, "r_y2": 367.97, "r_x3": 439.53, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.18, "t": 380.99, "r": 272.94, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 389.06, "r_x1": 272.94, "r_y1": 389.06, "r_x2": 272.94, "r_y2": 380.99, "r_x3": 245.18, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.02, "t": 380.99, "r": 310.0, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 389.06, "r_x1": 310.0, "r_y1": 389.06, "r_x2": 310.0, "r_y2": 380.99, "r_x3": 289.02, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.72, "t": 380.99, "r": 347.7, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 389.06, "r_x1": 347.7, "r_y1": 389.06, "r_x2": 347.7, "r_y2": 380.99, "r_x3": 326.72, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.68, "t": 380.99, "r": 384.66, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 389.06, "r_x1": 384.66, "r_y1": 389.06, "r_x2": 384.66, "r_y2": 380.99, "r_x3": 363.68, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.21, "t": 380.99, "r": 417.19, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 389.06, "r_x1": 417.19, "r_y1": 389.06, "r_x2": 417.19, "r_y2": 380.99, "r_x3": 396.21, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.77, "t": 380.99, "r": 457.15, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 389.06, "r_x1": 457.15, "r_y1": 389.06, "r_x2": 457.15, "r_y2": 380.99, "r_x3": 440.77, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.91, "t": 399.82, "r": 166.51, "b": 407.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 407.89, "r_x1": 166.51, "r_y1": 407.89, "r_x2": 166.51, "r_y2": 399.82, "r_x3": 161.91, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.51, "t": 399.82, "r": 214.12, "b": 407.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 407.89, "r_x1": 214.12, "r_y1": 407.89, "r_x2": 214.12, "r_y2": 399.82, "r_x3": 209.51, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.71, "t": 394.34, "r": 271.41, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 402.41, "r_x1": 271.41, "r_y1": 402.41, "r_x2": 271.41, "r_y2": 394.34, "r_x3": 246.71, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.02, "t": 394.34, "r": 310.0, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 402.41, "r_x1": 310.0, "r_y1": 402.41, "r_x2": 310.0, "r_y2": 394.34, "r_x3": 289.02, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.72, "t": 394.34, "r": 347.7, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 402.41, "r_x1": 347.7, "r_y1": 402.41, "r_x2": 347.7, "r_y2": 394.34, "r_x3": 326.72, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.68, "t": 394.34, "r": 384.66, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 402.41, "r_x1": 384.66, "r_y1": 402.41, "r_x2": 384.66, "r_y2": 394.34, "r_x3": 363.68, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.62, "t": 394.28, "r": 418.78, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 402.2, "r_x1": 418.78, "r_y1": 402.2, "r_x2": 418.78, "r_y2": 394.28, "r_x3": 394.62, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.53, "t": 394.28, "r": 458.38, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 402.2, "r_x1": 458.38, "r_y1": 402.2, "r_x2": 458.38, "r_y2": 394.28, "r_x3": 439.53, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.18, "t": 407.29, "r": 272.94, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 415.36, "r_x1": 272.94, "r_y1": 415.36, "r_x2": 272.94, "r_y2": 407.29, "r_x3": 245.18, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.02, "t": 407.29, "r": 310.0, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 415.36, "r_x1": 310.0, "r_y1": 415.36, "r_x2": 310.0, "r_y2": 407.29, "r_x3": 289.02, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.72, "t": 407.29, "r": 347.7, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 415.36, "r_x1": 347.7, "r_y1": 415.36, "r_x2": 347.7, "r_y2": 407.29, "r_x3": 326.72, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.09, "t": 407.23, "r": 386.25, "b": 415.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 415.15, "r_x1": 386.25, "r_y1": 415.15, "r_x2": 386.25, "r_y2": 407.23, "r_x3": 362.09, "r_y3": 407.23, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.21, "t": 407.29, "r": 417.19, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 415.36, "r_x1": 417.19, "r_y1": 415.36, "r_x2": 417.19, "r_y2": 407.29, "r_x3": 396.21, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.77, "t": 407.29, "r": 457.15, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 415.36, "r_x1": 457.15, "r_y1": 415.36, "r_x2": 457.15, "r_y2": 407.29, "r_x3": 440.77, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.91, "t": 426.12, "r": 166.51, "b": 434.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 434.19, "r_x1": 166.51, "r_y1": 434.19, "r_x2": 166.51, "r_y2": 426.12, "r_x3": 161.91, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.51, "t": 426.12, "r": 214.12, "b": 434.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 434.19, "r_x1": 214.12, "r_y1": 434.19, "r_x2": 214.12, "r_y2": 426.12, "r_x3": 209.51, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.71, "t": 420.64, "r": 271.41, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 428.71, "r_x1": 271.41, "r_y1": 428.71, "r_x2": 271.41, "r_y2": 420.64, "r_x3": 246.71, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.02, "t": 420.64, "r": 310.0, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 428.71, "r_x1": 310.0, "r_y1": 428.71, "r_x2": 310.0, "r_y2": 420.64, "r_x3": 289.02, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.72, "t": 420.64, "r": 347.7, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 428.71, "r_x1": 347.7, "r_y1": 428.71, "r_x2": 347.7, "r_y2": 420.64, "r_x3": 326.72, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.68, "t": 420.64, "r": 384.66, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 428.71, "r_x1": 384.66, "r_y1": 428.71, "r_x2": 384.66, "r_y2": 420.64, "r_x3": 363.68, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.62, "t": 420.58, "r": 418.78, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 428.5, "r_x1": 418.78, "r_y1": 428.5, "r_x2": 418.78, "r_y2": 420.58, "r_x3": 394.62, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.53, "t": 420.58, "r": 458.38, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 428.5, "r_x1": 458.38, "r_y1": 428.5, "r_x2": 458.38, "r_y2": 420.58, "r_x3": 439.53, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.18, "t": 433.59, "r": 272.94, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 441.66, "r_x1": 272.94, "r_y1": 441.66, "r_x2": 272.94, "r_y2": 433.59, "r_x3": 245.18, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.02, "t": 433.59, "r": 310.0, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 441.66, "r_x1": 310.0, "r_y1": 441.66, "r_x2": 310.0, "r_y2": 433.59, "r_x3": 289.02, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.72, "t": 433.59, "r": 347.7, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 441.66, "r_x1": 347.7, "r_y1": 441.66, "r_x2": 347.7, "r_y2": 433.59, "r_x3": 326.72, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.09, "t": 433.53, "r": 386.25, "b": 441.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 441.45, "r_x1": 386.25, "r_y1": 441.45, "r_x2": 386.25, "r_y2": 433.53, "r_x3": 362.09, "r_y3": 433.53, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.21, "t": 433.59, "r": 417.19, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 441.66, "r_x1": 417.19, "r_y1": 441.66, "r_x2": 417.19, "r_y2": 433.59, "r_x3": 396.21, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.77, "t": 433.59, "r": 457.15, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 441.66, "r_x1": 457.15, "r_y1": 441.66, "r_x2": 457.15, "r_y2": 433.59, "r_x3": 440.77, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.91, "t": 452.42, "r": 166.51, "b": 460.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 460.49, "r_x1": 166.51, "r_y1": 460.49, "r_x2": 166.51, "r_y2": 452.42, "r_x3": 161.91, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.51, "t": 452.42, "r": 214.12, "b": 460.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 460.49, "r_x1": 214.12, "r_y1": 460.49, "r_x2": 214.12, "r_y2": 452.42, "r_x3": 209.51, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.71, "t": 446.94, "r": 271.41, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 455.01, "r_x1": 271.41, "r_y1": 455.01, "r_x2": 271.41, "r_y2": 446.94, "r_x3": 246.71, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.02, "t": 446.94, "r": 310.0, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 455.01, "r_x1": 310.0, "r_y1": 455.01, "r_x2": 310.0, "r_y2": 446.94, "r_x3": 289.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.02, "t": 446.94, "r": 345.4, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.02, "r_y0": 455.01, "r_x1": 345.4, "r_y1": 455.01, "r_x2": 345.4, "r_y2": 446.94, "r_x3": 329.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.09, "t": 446.88, "r": 386.25, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 454.8, "r_x1": 386.25, "r_y1": 454.8, "r_x2": 386.25, "r_y2": 446.88, "r_x3": 362.09, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.62, "t": 446.88, "r": 418.78, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 454.8, "r_x1": 418.78, "r_y1": 454.8, "r_x2": 418.78, "r_y2": 446.88, "r_x3": 394.62, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.53, "t": 446.88, "r": 458.38, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 454.8, "r_x1": 458.38, "r_y1": 454.8, "r_x2": 458.38, "r_y2": 446.88, "r_x3": 439.53, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.18, "t": 459.89, "r": 272.94, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 467.96, "r_x1": 272.94, "r_y1": 467.96, "r_x2": 272.94, "r_y2": 459.89, "r_x3": 245.18, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.02, "t": 459.89, "r": 310.0, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 467.96, "r_x1": 310.0, "r_y1": 467.96, "r_x2": 310.0, "r_y2": 459.89, "r_x3": 289.02, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.72, "t": 459.89, "r": 347.7, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 467.96, "r_x1": 347.7, "r_y1": 467.96, "r_x2": 347.7, "r_y2": 459.89, "r_x3": 326.72, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.68, "t": 459.89, "r": 384.66, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 467.96, "r_x1": 384.66, "r_y1": 467.96, "r_x2": 384.66, "r_y2": 459.89, "r_x3": 363.68, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.21, "t": 459.89, "r": 417.19, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 467.96, "r_x1": 417.19, "r_y1": 467.96, "r_x2": 417.19, "r_y2": 459.89, "r_x3": 396.21, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.65, "t": 459.89, "r": 451.26, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65, "r_y0": 467.96, "r_x1": 451.26, "r_y1": 467.96, "r_x2": 451.26, "r_y2": 459.89, "r_x3": 446.65, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 6, "num_cols": 8, "table_cells": [ { "bbox": { "l": 160.37, "t": 341.73, "r": 168.05, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 207.97, "t": 341.73, "r": 215.65, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 239.8, "t": 347.21, "r": 278.32, "b": 355.28, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 324.67, "t": 341.73, "r": 348.26, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 396.27, "t": 341.73, "r": 417.13, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 394.93, "t": 352.69, "r": 418.47, "b": 360.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 430.77, "t": 341.73, "r": 467.14, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.15, "t": 352.69, "r": 470.76, "b": 360.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 286.69, "t": 354.69, "r": 312.33, "b": 362.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 320.7, "t": 354.69, "r": 353.72, "b": 362.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 369.31, "t": 354.69, "r": 379.03, "b": 362.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 373.52, "r": 166.51, "b": 381.59, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 373.52, "r": 214.12, "b": 381.59, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 368.04, "r": 271.41, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 368.04, "r": 310.0, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.72, "t": 368.04, "r": 347.7, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.68, "t": 368.04, "r": 384.66, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 397.27, "t": 367.97, "r": 416.13, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 367.97, "r": 458.38, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 399.82, "r": 166.51, "b": 407.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 399.82, "r": 214.12, "b": 407.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 394.34, "r": 271.41, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 394.34, "r": 310.0, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.72, "t": 394.34, "r": 347.7, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.68, "t": 394.34, "r": 384.66, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.62, "t": 394.28, "r": 418.78, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 394.28, "r": 458.38, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 426.12, "r": 166.51, "b": 434.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 426.12, "r": 214.12, "b": 434.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 420.64, "r": 271.41, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 420.64, "r": 310.0, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.72, "t": 420.64, "r": 347.7, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.68, "t": 420.64, "r": 384.66, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.62, "t": 420.58, "r": 418.78, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 420.58, "r": 458.38, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 452.42, "r": 166.51, "b": 460.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 452.42, "r": 214.12, "b": 460.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 446.94, "r": 271.41, "b": 455.01, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 446.94, "r": 310.0, "b": 455.01, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 329.02, "t": 446.94, "r": 345.4, "b": 455.01, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 362.09, "t": 446.88, "r": 386.25, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.62, "t": 446.88, "r": 418.78, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 446.88, "r": 458.38, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.76, "t": 508.15, "r": 264.4, "b": 516.96, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 516.96, "r_x1": 149.4, "r_y1": 516.96, "r_x2": 149.4, "r_y2": 508.15, "r_x3": 134.76, "r_y3": 508.15, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 516.96, "r_x1": 264.4, "r_y1": 516.96, "r_x2": 264.4, "r_y2": 508.15, "r_x3": 160.86, "r_y3": 508.15, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2 Quantitative Results" }, { "label": "text", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 524.55, "r": 480.6, "b": 617.03, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.76, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.6, "r_y1": 557.26, "r_x2": 480.6, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.76, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.6, "r_y1": 593.12, "r_x2": 480.6, "r_y2": 584.33, "r_x3": 134.76, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 206.79, "r_y1": 617.03, "r_x2": 206.79, "r_y2": 608.24, "r_x3": 134.76, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on difficult financial tables (FinTabNet) that contain sparse and large tables." }, { "label": "text", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 620.19, "r": 480.6, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 149.71, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.6, "r_y1": 640.94, "r_x2": 480.6, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 405.8, "r_y1": 664.85, "r_x2": 405.8, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation." } ], "body": [ { "label": "text", "id": 4, "page_no": 8, "cluster": { "id": 4, "label": "text", "bbox": { "l": 134.76, "t": 118.93, "r": 480.6, "b": 151.64, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.73, "r_x1": 480.59, "r_y1": 127.73, "r_x2": 480.59, "r_y2": 118.93, "r_x3": 134.76, "r_y3": 118.93, "coord_origin": "TOPLEFT" }, "text": "order to compute the TED score. Inference timing results for all experiments", "orig": "order to compute the TED score. Inference timing results for all experiments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 139.69, "r_x1": 480.6, "r_y1": 139.69, "r_x2": 480.6, "r_y2": 130.89, "r_x3": 134.76, "r_y3": 130.89, "coord_origin": "TOPLEFT" }, "text": "were obtained from the same machine on a single core with AMD EPYC 7763", "orig": "were obtained from the same machine on a single core with AMD EPYC 7763", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 151.64, "r_x1": 210.78, "r_y1": 151.64, "r_x2": 210.78, "r_y2": 142.84, "r_x3": 134.76, "r_y3": 142.84, "coord_origin": "TOPLEFT" }, "text": "CPU @2.45 GHz.", "orig": "CPU @2.45 GHz.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "order to compute the TED score. Inference timing results for all experiments were obtained from the same machine on a single core with AMD EPYC 7763 CPU @2.45 GHz." }, { "label": "section_header", "id": 6, "page_no": 8, "cluster": { "id": 6, "label": "section_header", "bbox": { "l": 134.76, "t": 169.19, "r": 318.45, "b": 177.99, "coord_origin": "TOPLEFT" }, "confidence": 0.958, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 177.99, "r_x1": 149.4, "r_y1": 177.99, "r_x2": 149.4, "r_y2": 169.19, "r_x3": 134.76, "r_y3": 169.19, "coord_origin": "TOPLEFT" }, "text": "5.1", "orig": "5.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 177.99, "r_x1": 318.45, "r_y1": 177.99, "r_x2": 318.45, "r_y2": 169.19, "r_x3": 160.86, "r_y3": 169.19, "coord_origin": "TOPLEFT" }, "text": "Hyper Parameter Optimization", "orig": "Hyper Parameter Optimization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.1 Hyper Parameter Optimization" }, { "label": "text", "id": 3, "page_no": 8, "cluster": { "id": 3, "label": "text", "bbox": { "l": 134.76, "t": 185.59, "r": 480.59, "b": 254.16, "coord_origin": "TOPLEFT" }, "confidence": 0.984, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 194.38, "r_x1": 480.59, "r_y1": 194.38, "r_x2": 480.59, "r_y2": 185.59, "r_x3": 134.76, "r_y3": 185.59, "coord_origin": "TOPLEFT" }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "orig": "We have chosen the PubTabNet data set to perform HPO, since it includes a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 206.34, "r_x1": 480.59, "r_y1": 206.34, "r_x2": 480.59, "r_y2": 197.54, "r_x3": 134.76, "r_y3": 197.54, "coord_origin": "TOPLEFT" }, "text": "highly diverse set of tables. Also we report TED scores separately for simple and", "orig": "highly diverse set of tables. Also we report TED scores separately for simple and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 218.29, "r_x1": 480.59, "r_y1": 218.29, "r_x2": 480.59, "r_y2": 209.5, "r_x3": 134.76, "r_y3": 209.5, "coord_origin": "TOPLEFT" }, "text": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "orig": "complex tables (tables with cell spans). Results are presented in Table. 1. It is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 230.25, "r_x1": 480.59, "r_y1": 230.25, "r_x2": 480.59, "r_y2": 221.45, "r_x3": 134.76, "r_y3": 221.45, "coord_origin": "TOPLEFT" }, "text": "evident that with OTSL, our model achieves the same TED score and slightly", "orig": "evident that with OTSL, our model achieves the same TED score and slightly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 242.2, "r_x1": 440.94, "r_y1": 242.2, "r_x2": 440.94, "r_y2": 233.41, "r_x3": 134.76, "r_y3": 233.41, "coord_origin": "TOPLEFT" }, "text": "better mAP scores in comparison to HTML. However OTSL yields a", "orig": "better mAP scores in comparison to HTML. However OTSL yields a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 444.87, "r_y0": 242.2, "r_x1": 480.59, "r_y1": 242.2, "r_x2": 480.59, "r_y2": 233.41, "r_x3": 444.87, "r_y3": 233.41, "coord_origin": "TOPLEFT" }, "text": "2x speed", "orig": "2x speed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 254.16, "r_x1": 145.2, "r_y1": 254.16, "r_x2": 145.2, "r_y2": 245.36, "r_x3": 134.76, "r_y3": 245.36, "coord_origin": "TOPLEFT" }, "text": "up", "orig": "up", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.15, "r_y0": 254.16, "r_x1": 311.22, "r_y1": 254.16, "r_x2": 311.22, "r_y2": 245.36, "r_x3": 149.15, "r_y3": 245.36, "coord_origin": "TOPLEFT" }, "text": "in the inference runtime over HTML.", "orig": "in the inference runtime over HTML.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We have chosen the PubTabNet data set to perform HPO, since it includes a highly diverse set of tables. Also we report TED scores separately for simple and complex tables (tables with cell spans). Results are presented in Table. 1. It is evident that with OTSL, our model achieves the same TED score and slightly better mAP scores in comparison to HTML. However OTSL yields a 2x speed up in the inference runtime over HTML." }, { "label": "caption", "id": 7, "page_no": 8, "cluster": { "id": 7, "label": "caption", "bbox": { "l": 134.76, "t": 275.07, "r": 480.6, "b": 327.04, "coord_origin": "TOPLEFT" }, "confidence": 0.957, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 283.0, "r_x1": 160.12, "r_y1": 283.0, "r_x2": 160.12, "r_y2": 275.07, "r_x3": 134.76, "r_y3": 275.07, "coord_origin": "TOPLEFT" }, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.35, "r_y0": 283.0, "r_x1": 175.6, "r_y1": 283.0, "r_x2": 175.6, "r_y2": 275.07, "r_x3": 167.35, "r_y3": 275.07, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 188.13, "r_y0": 283.2, "r_x1": 480.59, "r_y1": 283.2, "r_x2": 480.59, "r_y2": 275.14, "r_x3": 188.13, "r_y3": 275.14, "coord_origin": "TOPLEFT" }, "text": "HPO performed in OTSL and HTML representation on the same", "orig": "HPO performed in OTSL and HTML representation on the same", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 294.16, "r_x1": 480.59, "r_y1": 294.16, "r_x2": 480.59, "r_y2": 286.09, "r_x3": 134.76, "r_y3": 286.09, "coord_origin": "TOPLEFT" }, "text": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "orig": "transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Ef-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 305.12, "r_x1": 480.6, "r_y1": 305.12, "r_x2": 480.6, "r_y2": 297.05, "r_x3": 134.76, "r_y3": 297.05, "coord_origin": "TOPLEFT" }, "text": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "orig": "fects of reducing the # of layers in encoder and decoder stages of the model show that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 316.08, "r_x1": 480.59, "r_y1": 316.08, "r_x2": 480.59, "r_y2": 308.01, "r_x3": 134.76, "r_y3": 308.01, "coord_origin": "TOPLEFT" }, "text": "smaller models trained on OTSL perform better, especially in recognizing complex", "orig": "smaller models trained on OTSL perform better, especially in recognizing complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 327.04, "r_x1": 480.59, "r_y1": 327.04, "r_x2": 480.59, "r_y2": 318.97, "r_x3": 134.76, "r_y3": 318.97, "coord_origin": "TOPLEFT" }, "text": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "orig": "table structures, and maintain a much higher mAP score than the HTML counterpart.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 1. HPO performed in OTSL and HTML representation on the same transformer-based TableFormer [9] architecture, trained only on PubTabNet [22]. Effects of reducing the # of layers in encoder and decoder stages of the model show that smaller models trained on OTSL perform better, especially in recognizing complex table structures, and maintain a much higher mAP score than the HTML counterpart." }, { "label": "table", "id": 0, "page_no": 8, "cluster": { "id": 0, "label": "table", "bbox": { "l": 139.67, "t": 337.57, "r": 475.0, "b": 469.47, "coord_origin": "TOPLEFT" }, "confidence": 0.99, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8, "r_x1": 168.05, "r_y1": 349.8, "r_x2": 168.05, "r_y2": 341.73, "r_x3": 160.37, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.59, "r_y0": 362.76, "r_x1": 183.83, "r_y1": 362.76, "r_x2": 183.83, "r_y2": 354.69, "r_x3": 144.59, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.97, "r_y0": 349.8, "r_x1": 215.65, "r_y1": 349.8, "r_x2": 215.65, "r_y2": 341.73, "r_x3": 207.97, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19, "r_y0": 362.76, "r_x1": 231.43, "r_y1": 362.76, "r_x2": 231.43, "r_y2": 354.69, "r_x3": 192.19, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.28, "r_x1": 278.32, "r_y1": 355.28, "r_x2": 278.32, "r_y2": 347.21, "r_x3": 239.8, "r_y3": 347.21, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67, "r_y0": 349.8, "r_x1": 348.26, "r_y1": 349.8, "r_x2": 348.26, "r_y2": 341.73, "r_x3": 324.67, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 349.8, "r_x1": 417.13, "r_y1": 349.8, "r_x2": 417.13, "r_y2": 341.73, "r_x3": 396.27, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.93, "r_y0": 360.76, "r_x1": 418.47, "r_y1": 360.76, "r_x2": 418.47, "r_y2": 352.69, "r_x3": 394.93, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.77, "r_y0": 349.8, "r_x1": 467.14, "r_y1": 349.8, "r_x2": 467.14, "r_y2": 341.73, "r_x3": 430.77, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.15, "r_y0": 360.76, "r_x1": 470.76, "r_y1": 360.76, "r_x2": 470.76, "r_y2": 352.69, "r_x3": 427.15, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.69, "r_y0": 362.76, "r_x1": 312.33, "r_y1": 362.76, "r_x2": 312.33, "r_y2": 354.69, "r_x3": 286.69, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.76, "r_x1": 353.72, "r_y1": 362.76, "r_x2": 353.72, "r_y2": 354.69, "r_x3": 320.7, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.31, "r_y0": 362.76, "r_x1": 379.03, "r_y1": 362.76, "r_x2": 379.03, "r_y2": 354.69, "r_x3": 369.31, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 381.59, "r_x1": 166.51, "r_y1": 381.59, "r_x2": 166.51, "r_y2": 373.52, "r_x3": 161.91, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 381.59, "r_x1": 214.12, "r_y1": 381.59, "r_x2": 214.12, "r_y2": 373.52, "r_x3": 209.51, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 376.11, "r_x1": 271.41, "r_y1": 376.11, "r_x2": 271.41, "r_y2": 368.04, "r_x3": 246.71, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 376.11, "r_x1": 310.0, "r_y1": 376.11, "r_x2": 310.0, "r_y2": 368.04, "r_x3": 289.02, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 376.11, "r_x1": 347.7, "r_y1": 376.11, "r_x2": 347.7, "r_y2": 368.04, "r_x3": 326.72, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 376.11, "r_x1": 384.66, "r_y1": 376.11, "r_x2": 384.66, "r_y2": 368.04, "r_x3": 363.68, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.27, "r_y0": 375.9, "r_x1": 416.13, "r_y1": 375.9, "r_x2": 416.13, "r_y2": 367.97, "r_x3": 397.27, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 375.9, "r_x1": 458.38, "r_y1": 375.9, "r_x2": 458.38, "r_y2": 367.97, "r_x3": 439.53, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 389.06, "r_x1": 272.94, "r_y1": 389.06, "r_x2": 272.94, "r_y2": 380.99, "r_x3": 245.18, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 389.06, "r_x1": 310.0, "r_y1": 389.06, "r_x2": 310.0, "r_y2": 380.99, "r_x3": 289.02, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 389.06, "r_x1": 347.7, "r_y1": 389.06, "r_x2": 347.7, "r_y2": 380.99, "r_x3": 326.72, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 389.06, "r_x1": 384.66, "r_y1": 389.06, "r_x2": 384.66, "r_y2": 380.99, "r_x3": 363.68, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 389.06, "r_x1": 417.19, "r_y1": 389.06, "r_x2": 417.19, "r_y2": 380.99, "r_x3": 396.21, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 389.06, "r_x1": 457.15, "r_y1": 389.06, "r_x2": 457.15, "r_y2": 380.99, "r_x3": 440.77, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 407.89, "r_x1": 166.51, "r_y1": 407.89, "r_x2": 166.51, "r_y2": 399.82, "r_x3": 161.91, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 407.89, "r_x1": 214.12, "r_y1": 407.89, "r_x2": 214.12, "r_y2": 399.82, "r_x3": 209.51, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 402.41, "r_x1": 271.41, "r_y1": 402.41, "r_x2": 271.41, "r_y2": 394.34, "r_x3": 246.71, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 402.41, "r_x1": 310.0, "r_y1": 402.41, "r_x2": 310.0, "r_y2": 394.34, "r_x3": 289.02, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 402.41, "r_x1": 347.7, "r_y1": 402.41, "r_x2": 347.7, "r_y2": 394.34, "r_x3": 326.72, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 402.41, "r_x1": 384.66, "r_y1": 402.41, "r_x2": 384.66, "r_y2": 394.34, "r_x3": 363.68, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 402.2, "r_x1": 418.78, "r_y1": 402.2, "r_x2": 418.78, "r_y2": 394.28, "r_x3": 394.62, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 402.2, "r_x1": 458.38, "r_y1": 402.2, "r_x2": 458.38, "r_y2": 394.28, "r_x3": 439.53, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 415.36, "r_x1": 272.94, "r_y1": 415.36, "r_x2": 272.94, "r_y2": 407.29, "r_x3": 245.18, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 415.36, "r_x1": 310.0, "r_y1": 415.36, "r_x2": 310.0, "r_y2": 407.29, "r_x3": 289.02, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 415.36, "r_x1": 347.7, "r_y1": 415.36, "r_x2": 347.7, "r_y2": 407.29, "r_x3": 326.72, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 415.15, "r_x1": 386.25, "r_y1": 415.15, "r_x2": 386.25, "r_y2": 407.23, "r_x3": 362.09, "r_y3": 407.23, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 415.36, "r_x1": 417.19, "r_y1": 415.36, "r_x2": 417.19, "r_y2": 407.29, "r_x3": 396.21, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 415.36, "r_x1": 457.15, "r_y1": 415.36, "r_x2": 457.15, "r_y2": 407.29, "r_x3": 440.77, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 434.19, "r_x1": 166.51, "r_y1": 434.19, "r_x2": 166.51, "r_y2": 426.12, "r_x3": 161.91, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 434.19, "r_x1": 214.12, "r_y1": 434.19, "r_x2": 214.12, "r_y2": 426.12, "r_x3": 209.51, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 428.71, "r_x1": 271.41, "r_y1": 428.71, "r_x2": 271.41, "r_y2": 420.64, "r_x3": 246.71, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 428.71, "r_x1": 310.0, "r_y1": 428.71, "r_x2": 310.0, "r_y2": 420.64, "r_x3": 289.02, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 428.71, "r_x1": 347.7, "r_y1": 428.71, "r_x2": 347.7, "r_y2": 420.64, "r_x3": 326.72, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 428.71, "r_x1": 384.66, "r_y1": 428.71, "r_x2": 384.66, "r_y2": 420.64, "r_x3": 363.68, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 428.5, "r_x1": 418.78, "r_y1": 428.5, "r_x2": 418.78, "r_y2": 420.58, "r_x3": 394.62, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 428.5, "r_x1": 458.38, "r_y1": 428.5, "r_x2": 458.38, "r_y2": 420.58, "r_x3": 439.53, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 441.66, "r_x1": 272.94, "r_y1": 441.66, "r_x2": 272.94, "r_y2": 433.59, "r_x3": 245.18, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 441.66, "r_x1": 310.0, "r_y1": 441.66, "r_x2": 310.0, "r_y2": 433.59, "r_x3": 289.02, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 441.66, "r_x1": 347.7, "r_y1": 441.66, "r_x2": 347.7, "r_y2": 433.59, "r_x3": 326.72, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 441.45, "r_x1": 386.25, "r_y1": 441.45, "r_x2": 386.25, "r_y2": 433.53, "r_x3": 362.09, "r_y3": 433.53, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 441.66, "r_x1": 417.19, "r_y1": 441.66, "r_x2": 417.19, "r_y2": 433.59, "r_x3": 396.21, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 441.66, "r_x1": 457.15, "r_y1": 441.66, "r_x2": 457.15, "r_y2": 433.59, "r_x3": 440.77, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 460.49, "r_x1": 166.51, "r_y1": 460.49, "r_x2": 166.51, "r_y2": 452.42, "r_x3": 161.91, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 460.49, "r_x1": 214.12, "r_y1": 460.49, "r_x2": 214.12, "r_y2": 452.42, "r_x3": 209.51, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 455.01, "r_x1": 271.41, "r_y1": 455.01, "r_x2": 271.41, "r_y2": 446.94, "r_x3": 246.71, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 455.01, "r_x1": 310.0, "r_y1": 455.01, "r_x2": 310.0, "r_y2": 446.94, "r_x3": 289.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.02, "r_y0": 455.01, "r_x1": 345.4, "r_y1": 455.01, "r_x2": 345.4, "r_y2": 446.94, "r_x3": 329.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 454.8, "r_x1": 386.25, "r_y1": 454.8, "r_x2": 386.25, "r_y2": 446.88, "r_x3": 362.09, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 454.8, "r_x1": 418.78, "r_y1": 454.8, "r_x2": 418.78, "r_y2": 446.88, "r_x3": 394.62, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 454.8, "r_x1": 458.38, "r_y1": 454.8, "r_x2": 458.38, "r_y2": 446.88, "r_x3": 439.53, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 467.96, "r_x1": 272.94, "r_y1": 467.96, "r_x2": 272.94, "r_y2": 459.89, "r_x3": 245.18, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 467.96, "r_x1": 310.0, "r_y1": 467.96, "r_x2": 310.0, "r_y2": 459.89, "r_x3": 289.02, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 467.96, "r_x1": 347.7, "r_y1": 467.96, "r_x2": 347.7, "r_y2": 459.89, "r_x3": 326.72, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 467.96, "r_x1": 384.66, "r_y1": 467.96, "r_x2": 384.66, "r_y2": 459.89, "r_x3": 363.68, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 467.96, "r_x1": 417.19, "r_y1": 467.96, "r_x2": 417.19, "r_y2": 459.89, "r_x3": 396.21, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65, "r_y0": 467.96, "r_x1": 451.26, "r_y1": 467.96, "r_x2": 451.26, "r_y2": 459.89, "r_x3": 446.65, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 11, "label": "text", "bbox": { "l": 160.37, "t": 341.73, "r": 168.05, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.37, "r_y0": 349.8, "r_x1": 168.05, "r_y1": 349.8, "r_x2": 168.05, "r_y2": 341.73, "r_x3": 160.37, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 144.59, "t": 354.69, "r": 183.83, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 144.59, "r_y0": 362.76, "r_x1": 183.83, "r_y1": 362.76, "r_x2": 183.83, "r_y2": 354.69, "r_x3": 144.59, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "enc-layers", "orig": "enc-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 207.97, "t": 341.73, "r": 215.65, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 207.97, "r_y0": 349.8, "r_x1": 215.65, "r_y1": 349.8, "r_x2": 215.65, "r_y2": 341.73, "r_x3": 207.97, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 192.19, "t": 354.69, "r": 231.43, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 192.19, "r_y0": 362.76, "r_x1": 231.43, "r_y1": 362.76, "r_x2": 231.43, "r_y2": 354.69, "r_x3": 192.19, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "dec-layers", "orig": "dec-layers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 239.8, "t": 347.21, "r": 278.32, "b": 355.28, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 239.8, "r_y0": 355.28, "r_x1": 278.32, "r_y1": 355.28, "r_x2": 278.32, "r_y2": 347.21, "r_x3": 239.8, "r_y3": 347.21, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 324.67, "t": 341.73, "r": 348.26, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 324.67, "r_y0": 349.8, "r_x1": 348.26, "r_y1": 349.8, "r_x2": 348.26, "r_y2": 341.73, "r_x3": 324.67, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 396.27, "t": 341.73, "r": 417.13, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.27, "r_y0": 349.8, "r_x1": 417.13, "r_y1": 349.8, "r_x2": 417.13, "r_y2": 341.73, "r_x3": 396.27, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 394.93, "t": 352.69, "r": 418.47, "b": 360.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.93, "r_y0": 360.76, "r_x1": 418.47, "r_y1": 360.76, "r_x2": 418.47, "r_y2": 352.69, "r_x3": 394.93, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "(0.75)", "orig": "(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 430.77, "t": 341.73, "r": 467.14, "b": 349.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 430.77, "r_y0": 349.8, "r_x1": 467.14, "r_y1": 349.8, "r_x2": 467.14, "r_y2": 341.73, "r_x3": 430.77, "r_y3": 341.73, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 427.15, "t": 352.69, "r": 470.76, "b": 360.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 427.15, "r_y0": 360.76, "r_x1": 470.76, "r_y1": 360.76, "r_x2": 470.76, "r_y2": 352.69, "r_x3": 427.15, "r_y3": 352.69, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 286.69, "t": 354.69, "r": 312.33, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 286.69, "r_y0": 362.76, "r_x1": 312.33, "r_y1": 362.76, "r_x2": 312.33, "r_y2": 354.69, "r_x3": 286.69, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 320.7, "t": 354.69, "r": 353.72, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 320.7, "r_y0": 362.76, "r_x1": 353.72, "r_y1": 362.76, "r_x2": 353.72, "r_y2": 354.69, "r_x3": 320.7, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 369.31, "t": 354.69, "r": 379.03, "b": 362.76, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 369.31, "r_y0": 362.76, "r_x1": 379.03, "r_y1": 362.76, "r_x2": 379.03, "r_y2": 354.69, "r_x3": 369.31, "r_y3": 354.69, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 161.91, "t": 373.52, "r": 166.51, "b": 381.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 381.59, "r_x1": 166.51, "r_y1": 381.59, "r_x2": 166.51, "r_y2": 373.52, "r_x3": 161.91, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 209.51, "t": 373.52, "r": 214.12, "b": 381.59, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 381.59, "r_x1": 214.12, "r_y1": 381.59, "r_x2": 214.12, "r_y2": 373.52, "r_x3": 209.51, "r_y3": 373.52, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 246.71, "t": 368.04, "r": 271.41, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 376.11, "r_x1": 271.41, "r_y1": 376.11, "r_x2": 271.41, "r_y2": 368.04, "r_x3": 246.71, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 289.02, "t": 368.04, "r": 310.0, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 376.11, "r_x1": 310.0, "r_y1": 376.11, "r_x2": 310.0, "r_y2": 368.04, "r_x3": 289.02, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 326.72, "t": 368.04, "r": 347.7, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 376.11, "r_x1": 347.7, "r_y1": 376.11, "r_x2": 347.7, "r_y2": 368.04, "r_x3": 326.72, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 363.68, "t": 368.04, "r": 384.66, "b": 376.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 376.11, "r_x1": 384.66, "r_y1": 376.11, "r_x2": 384.66, "r_y2": 368.04, "r_x3": 363.68, "r_y3": 368.04, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 397.27, "t": 367.97, "r": 416.13, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.27, "r_y0": 375.9, "r_x1": 416.13, "r_y1": 375.9, "r_x2": 416.13, "r_y2": 367.97, "r_x3": 397.27, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 439.53, "t": 367.97, "r": 458.38, "b": 375.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 375.9, "r_x1": 458.38, "r_y1": 375.9, "r_x2": 458.38, "r_y2": 367.97, "r_x3": 439.53, "r_y3": 367.97, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 245.18, "t": 380.99, "r": 272.94, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 389.06, "r_x1": 272.94, "r_y1": 389.06, "r_x2": 272.94, "r_y2": 380.99, "r_x3": 245.18, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 289.02, "t": 380.99, "r": 310.0, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 389.06, "r_x1": 310.0, "r_y1": 389.06, "r_x2": 310.0, "r_y2": 380.99, "r_x3": 289.02, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 326.72, "t": 380.99, "r": 347.7, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 389.06, "r_x1": 347.7, "r_y1": 389.06, "r_x2": 347.7, "r_y2": 380.99, "r_x3": 326.72, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 363.68, "t": 380.99, "r": 384.66, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 389.06, "r_x1": 384.66, "r_y1": 389.06, "r_x2": 384.66, "r_y2": 380.99, "r_x3": 363.68, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 396.21, "t": 380.99, "r": 417.19, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 389.06, "r_x1": 417.19, "r_y1": 389.06, "r_x2": 417.19, "r_y2": 380.99, "r_x3": 396.21, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 440.77, "t": 380.99, "r": 457.15, "b": 389.06, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 389.06, "r_x1": 457.15, "r_y1": 389.06, "r_x2": 457.15, "r_y2": 380.99, "r_x3": 440.77, "r_y3": 380.99, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 161.91, "t": 399.82, "r": 166.51, "b": 407.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 407.89, "r_x1": 166.51, "r_y1": 407.89, "r_x2": 166.51, "r_y2": 399.82, "r_x3": 161.91, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 209.51, "t": 399.82, "r": 214.12, "b": 407.89, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 407.89, "r_x1": 214.12, "r_y1": 407.89, "r_x2": 214.12, "r_y2": 399.82, "r_x3": 209.51, "r_y3": 399.82, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 246.71, "t": 394.34, "r": 271.41, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 402.41, "r_x1": 271.41, "r_y1": 402.41, "r_x2": 271.41, "r_y2": 394.34, "r_x3": 246.71, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 289.02, "t": 394.34, "r": 310.0, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 402.41, "r_x1": 310.0, "r_y1": 402.41, "r_x2": 310.0, "r_y2": 394.34, "r_x3": 289.02, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 326.72, "t": 394.34, "r": 347.7, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 402.41, "r_x1": 347.7, "r_y1": 402.41, "r_x2": 347.7, "r_y2": 394.34, "r_x3": 326.72, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.904", "orig": "0.904", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 363.68, "t": 394.34, "r": 384.66, "b": 402.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 402.41, "r_x1": 384.66, "r_y1": 402.41, "r_x2": 384.66, "r_y2": 394.34, "r_x3": 363.68, "r_y3": 394.34, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 394.62, "t": 394.28, "r": 418.78, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 402.2, "r_x1": 418.78, "r_y1": 402.2, "r_x2": 418.78, "r_y2": 394.28, "r_x3": 394.62, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "0.853", "orig": "0.853", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 439.53, "t": 394.28, "r": 458.38, "b": 402.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 402.2, "r_x1": 458.38, "r_y1": 402.2, "r_x2": 458.38, "r_y2": 394.28, "r_x3": 439.53, "r_y3": 394.28, "coord_origin": "TOPLEFT" }, "text": "1.97", "orig": "1.97", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 245.18, "t": 407.29, "r": 272.94, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 415.36, "r_x1": 272.94, "r_y1": 415.36, "r_x2": 272.94, "r_y2": 407.29, "r_x3": 245.18, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 289.02, "t": 407.29, "r": 310.0, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 415.36, "r_x1": 310.0, "r_y1": 415.36, "r_x2": 310.0, "r_y2": 407.29, "r_x3": 289.02, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 326.72, "t": 407.29, "r": 347.7, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 415.36, "r_x1": 347.7, "r_y1": 415.36, "r_x2": 347.7, "r_y2": 407.29, "r_x3": 326.72, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.909", "orig": "0.909", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 362.09, "t": 407.23, "r": 386.25, "b": 415.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 415.15, "r_x1": 386.25, "r_y1": 415.15, "r_x2": 386.25, "r_y2": 407.23, "r_x3": 362.09, "r_y3": 407.23, "coord_origin": "TOPLEFT" }, "text": "0.938", "orig": "0.938", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 396.21, "t": 407.29, "r": 417.19, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 415.36, "r_x1": 417.19, "r_y1": 415.36, "r_x2": 417.19, "r_y2": 407.29, "r_x3": 396.21, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "0.843", "orig": "0.843", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 440.77, "t": 407.29, "r": 457.15, "b": 415.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 415.36, "r_x1": 457.15, "r_y1": 415.36, "r_x2": 457.15, "r_y2": 407.29, "r_x3": 440.77, "r_y3": 407.29, "coord_origin": "TOPLEFT" }, "text": "3.77", "orig": "3.77", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 161.91, "t": 426.12, "r": 166.51, "b": 434.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 434.19, "r_x1": 166.51, "r_y1": 434.19, "r_x2": 166.51, "r_y2": 426.12, "r_x3": 161.91, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 209.51, "t": 426.12, "r": 214.12, "b": 434.19, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 434.19, "r_x1": 214.12, "r_y1": 434.19, "r_x2": 214.12, "r_y2": 426.12, "r_x3": 209.51, "r_y3": 426.12, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 246.71, "t": 420.64, "r": 271.41, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 428.71, "r_x1": 271.41, "r_y1": 428.71, "r_x2": 271.41, "r_y2": 420.64, "r_x3": 246.71, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 289.02, "t": 420.64, "r": 310.0, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 428.71, "r_x1": 310.0, "r_y1": 428.71, "r_x2": 310.0, "r_y2": 420.64, "r_x3": 289.02, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.923", "orig": "0.923", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 326.72, "t": 420.64, "r": 347.7, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 428.71, "r_x1": 347.7, "r_y1": 428.71, "r_x2": 347.7, "r_y2": 420.64, "r_x3": 326.72, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.897", "orig": "0.897", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 363.68, "t": 420.64, "r": 384.66, "b": 428.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 428.71, "r_x1": 384.66, "r_y1": 428.71, "r_x2": 384.66, "r_y2": 420.64, "r_x3": 363.68, "r_y3": 420.64, "coord_origin": "TOPLEFT" }, "text": "0.915", "orig": "0.915", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 58, "label": "text", "bbox": { "l": 394.62, "t": 420.58, "r": 418.78, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 428.5, "r_x1": 418.78, "r_y1": 428.5, "r_x2": 418.78, "r_y2": 420.58, "r_x3": 394.62, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "0.859", "orig": "0.859", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 439.53, "t": 420.58, "r": 458.38, "b": 428.5, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 428.5, "r_x1": 458.38, "r_y1": 428.5, "r_x2": 458.38, "r_y2": 420.58, "r_x3": 439.53, "r_y3": 420.58, "coord_origin": "TOPLEFT" }, "text": "1.91", "orig": "1.91", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 245.18, "t": 433.59, "r": 272.94, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 441.66, "r_x1": 272.94, "r_y1": 441.66, "r_x2": 272.94, "r_y2": 433.59, "r_x3": 245.18, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 289.02, "t": 433.59, "r": 310.0, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 441.66, "r_x1": 310.0, "r_y1": 441.66, "r_x2": 310.0, "r_y2": 433.59, "r_x3": 289.02, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.945", "orig": "0.945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 326.72, "t": 433.59, "r": 347.7, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 441.66, "r_x1": 347.7, "r_y1": 441.66, "r_x2": 347.7, "r_y2": 433.59, "r_x3": 326.72, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.901", "orig": "0.901", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 362.09, "t": 433.53, "r": 386.25, "b": 441.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 441.45, "r_x1": 386.25, "r_y1": 441.45, "r_x2": 386.25, "r_y2": 433.53, "r_x3": 362.09, "r_y3": 433.53, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 396.21, "t": 433.59, "r": 417.19, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 441.66, "r_x1": 417.19, "r_y1": 441.66, "r_x2": 417.19, "r_y2": 433.59, "r_x3": 396.21, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "0.834", "orig": "0.834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 440.77, "t": 433.59, "r": 457.15, "b": 441.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 440.77, "r_y0": 441.66, "r_x1": 457.15, "r_y1": 441.66, "r_x2": 457.15, "r_y2": 433.59, "r_x3": 440.77, "r_y3": 433.59, "coord_origin": "TOPLEFT" }, "text": "3.81", "orig": "3.81", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 161.91, "t": 452.42, "r": 166.51, "b": 460.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 161.91, "r_y0": 460.49, "r_x1": 166.51, "r_y1": 460.49, "r_x2": 166.51, "r_y2": 452.42, "r_x3": 161.91, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 209.51, "t": 452.42, "r": 214.12, "b": 460.49, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 209.51, "r_y0": 460.49, "r_x1": 214.12, "r_y1": 460.49, "r_x2": 214.12, "r_y2": 452.42, "r_x3": 209.51, "r_y3": 452.42, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 246.71, "t": 446.94, "r": 271.41, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 246.71, "r_y0": 455.01, "r_x1": 271.41, "r_y1": 455.01, "r_x2": 271.41, "r_y2": 446.94, "r_x3": 246.71, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 289.02, "t": 446.94, "r": 310.0, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 455.01, "r_x1": 310.0, "r_y1": 455.01, "r_x2": 310.0, "r_y2": 446.94, "r_x3": 289.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.952", "orig": "0.952", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 329.02, "t": 446.94, "r": 345.4, "b": 455.01, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 329.02, "r_y0": 455.01, "r_x1": 345.4, "r_y1": 455.01, "r_x2": 345.4, "r_y2": 446.94, "r_x3": 329.02, "r_y3": 446.94, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 362.09, "t": 446.88, "r": 386.25, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 362.09, "r_y0": 454.8, "r_x1": 386.25, "r_y1": 454.8, "r_x2": 386.25, "r_y2": 446.88, "r_x3": 362.09, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.942", "orig": "0.942", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 394.62, "t": 446.88, "r": 418.78, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 394.62, "r_y0": 454.8, "r_x1": 418.78, "r_y1": 454.8, "r_x2": 418.78, "r_y2": 446.88, "r_x3": 394.62, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 439.53, "t": 446.88, "r": 458.38, "b": 454.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 439.53, "r_y0": 454.8, "r_x1": 458.38, "r_y1": 454.8, "r_x2": 458.38, "r_y2": 446.88, "r_x3": 439.53, "r_y3": 446.88, "coord_origin": "TOPLEFT" }, "text": "1.22", "orig": "1.22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 245.18, "t": 459.89, "r": 272.94, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 245.18, "r_y0": 467.96, "r_x1": 272.94, "r_y1": 467.96, "r_x2": 272.94, "r_y2": 459.89, "r_x3": 245.18, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 289.02, "t": 459.89, "r": 310.0, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 289.02, "r_y0": 467.96, "r_x1": 310.0, "r_y1": 467.96, "r_x2": 310.0, "r_y2": 459.89, "r_x3": 289.02, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 326.72, "t": 459.89, "r": 347.7, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 326.72, "r_y0": 467.96, "r_x1": 347.7, "r_y1": 467.96, "r_x2": 347.7, "r_y2": 459.89, "r_x3": 326.72, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.903", "orig": "0.903", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 363.68, "t": 459.89, "r": 384.66, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 363.68, "r_y0": 467.96, "r_x1": 384.66, "r_y1": 467.96, "r_x2": 384.66, "r_y2": 459.89, "r_x3": 363.68, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.931", "orig": "0.931", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 396.21, "t": 459.89, "r": 417.19, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 396.21, "r_y0": 467.96, "r_x1": 417.19, "r_y1": 467.96, "r_x2": 417.19, "r_y2": 459.89, "r_x3": 396.21, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "0.824", "orig": "0.824", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 446.65, "t": 459.89, "r": 451.26, "b": 467.96, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 446.65, "r_y0": 467.96, "r_x1": 451.26, "r_y1": 467.96, "r_x2": 451.26, "r_y2": 459.89, "r_x3": 446.65, "r_y3": 459.89, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ucel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 6, "num_cols": 8, "table_cells": [ { "bbox": { "l": 160.37, "t": 341.73, "r": 168.05, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "# enc-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 207.97, "t": 341.73, "r": 215.65, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "# dec-layers", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 239.8, "t": 347.21, "r": 278.32, "b": 355.28, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 324.67, "t": 341.73, "r": 348.26, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 6, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 396.27, "t": 341.73, "r": 417.13, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "mAP", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 394.93, "t": 352.69, "r": 418.47, "b": 360.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 430.77, "t": 341.73, "r": 467.14, "b": 349.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "Inference", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 427.15, "t": 352.69, "r": 470.76, "b": 360.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 286.69, "t": 354.69, "r": 312.33, "b": 362.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 320.7, "t": 354.69, "r": 353.72, "b": 362.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 369.31, "t": 354.69, "r": 379.03, "b": 362.76, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 373.52, "r": 166.51, "b": 381.59, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 373.52, "r": 214.12, "b": 381.59, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "6", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 368.04, "r": 271.41, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 368.04, "r": 310.0, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.72, "t": 368.04, "r": 347.7, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.68, "t": 368.04, "r": 384.66, "b": 376.11, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 397.27, "t": 367.97, "r": 416.13, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 367.97, "r": 458.38, "b": 375.9, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 399.82, "r": 166.51, "b": 407.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 399.82, "r": 214.12, "b": 407.89, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 394.34, "r": 271.41, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 394.34, "r": 310.0, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.938 0.952", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.72, "t": 394.34, "r": 347.7, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.904 0.909", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.68, "t": 394.34, "r": 384.66, "b": 402.41, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.927 0.938", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.62, "t": 394.28, "r": 418.78, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.853 0.843", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 394.28, "r": 458.38, "b": 402.2, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.97 3.77", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 426.12, "r": 166.51, "b": 434.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 426.12, "r": 214.12, "b": 434.19, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 420.64, "r": 271.41, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 420.64, "r": 310.0, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.923 0.945", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 326.72, "t": 420.64, "r": 347.7, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.897 0.901", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 363.68, "t": 420.64, "r": 384.66, "b": 428.71, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.915 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.62, "t": 420.58, "r": 418.78, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.859 0.834", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 420.58, "r": 458.38, "b": 428.5, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.91 3.81", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 161.91, "t": 452.42, "r": 166.51, "b": 460.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "4", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 209.51, "t": 452.42, "r": 214.12, "b": 460.49, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "2", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 246.71, "t": 446.94, "r": 271.41, "b": 455.01, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 289.02, "t": 446.94, "r": 310.0, "b": 455.01, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.952 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 329.02, "t": 446.94, "r": 345.4, "b": 455.01, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.92 0.903", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 362.09, "t": 446.88, "r": 386.25, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.942 0.931", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 394.62, "t": 446.88, "r": 418.78, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "0.857 0.824", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 439.53, "t": 446.88, "r": 458.38, "b": 454.8, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 7, "end_col_offset_idx": 8, "text": "1.22 2", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 5, "page_no": 8, "cluster": { "id": 5, "label": "section_header", "bbox": { "l": 134.76, "t": 508.15, "r": 264.4, "b": 516.96, "coord_origin": "TOPLEFT" }, "confidence": 0.959, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 516.96, "r_x1": 149.4, "r_y1": 516.96, "r_x2": 149.4, "r_y2": 508.15, "r_x3": 134.76, "r_y3": 508.15, "coord_origin": "TOPLEFT" }, "text": "5.2", "orig": "5.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 516.96, "r_x1": 264.4, "r_y1": 516.96, "r_x2": 264.4, "r_y2": 508.15, "r_x3": 160.86, "r_y3": 508.15, "coord_origin": "TOPLEFT" }, "text": "Quantitative Results", "orig": "Quantitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.2 Quantitative Results" }, { "label": "text", "id": 1, "page_no": 8, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 524.55, "r": 480.6, "b": 617.03, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 533.35, "r_x1": 480.59, "r_y1": 533.35, "r_x2": 480.59, "r_y2": 524.55, "r_x3": 134.76, "r_y3": 524.55, "coord_origin": "TOPLEFT" }, "text": "We picked the model parameter configuration that produced the best prediction", "orig": "We picked the model parameter configuration that produced the best prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 545.3, "r_x1": 480.59, "r_y1": 545.3, "r_x2": 480.59, "r_y2": 536.51, "r_x3": 134.76, "r_y3": 536.51, "coord_origin": "TOPLEFT" }, "text": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "orig": "quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 557.26, "r_x1": 480.6, "r_y1": 557.26, "r_x2": 480.6, "r_y2": 548.46, "r_x3": 134.76, "r_y3": 548.46, "coord_origin": "TOPLEFT" }, "text": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "orig": "trained and evaluated it on three publicly available data sets: PubTabNet (395k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 569.21, "r_x1": 480.59, "r_y1": 569.21, "r_x2": 480.59, "r_y2": 560.42, "r_x3": 134.76, "r_y3": 560.42, "coord_origin": "TOPLEFT" }, "text": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "orig": "samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 581.17, "r_x1": 480.59, "r_y1": 581.17, "r_x2": 480.59, "r_y2": 572.37, "r_x3": 134.76, "r_y3": 572.37, "coord_origin": "TOPLEFT" }, "text": "Performance results are presented in Table. 2. It is clearly evident that the model", "orig": "Performance results are presented in Table. 2. It is clearly evident that the model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 593.12, "r_x1": 480.6, "r_y1": 593.12, "r_x2": 480.6, "r_y2": 584.33, "r_x3": 134.76, "r_y3": 584.33, "coord_origin": "TOPLEFT" }, "text": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "orig": "trained on OTSL outperforms HTML across the board, keeping high TEDs and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 605.08, "r_x1": 480.59, "r_y1": 605.08, "r_x2": 480.59, "r_y2": 596.28, "r_x3": 134.76, "r_y3": 596.28, "coord_origin": "TOPLEFT" }, "text": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "orig": "mAP scores even on difficult financial tables (FinTabNet) that contain sparse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 617.03, "r_x1": 206.79, "r_y1": 617.03, "r_x2": 206.79, "r_y2": 608.24, "r_x3": 134.76, "r_y3": 608.24, "coord_origin": "TOPLEFT" }, "text": "and large tables.", "orig": "and large tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We picked the model parameter configuration that produced the best prediction quality (enc=6, dec=6, heads=8) with PubTabNet alone, then independently trained and evaluated it on three publicly available data sets: PubTabNet (395k samples), FinTabNet (113k samples) and PubTables-1M (about 1M samples). Performance results are presented in Table. 2. It is clearly evident that the model trained on OTSL outperforms HTML across the board, keeping high TEDs and mAP scores even on difficult financial tables (FinTabNet) that contain sparse and large tables." }, { "label": "text", "id": 2, "page_no": 8, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 620.19, "r": 480.6, "b": 664.85, "coord_origin": "TOPLEFT" }, "confidence": 0.985, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 628.99, "r_x1": 480.59, "r_y1": 628.99, "r_x2": 480.59, "r_y2": 620.19, "r_x3": 149.71, "r_y3": 620.19, "coord_origin": "TOPLEFT" }, "text": "Additionally, the results show that OTSL has an advantage over HTML", "orig": "Additionally, the results show that OTSL has an advantage over HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 640.94, "r_x1": 480.6, "r_y1": 640.94, "r_x2": 480.6, "r_y2": 632.15, "r_x3": 134.76, "r_y3": 632.15, "coord_origin": "TOPLEFT" }, "text": "when applied on a bigger data set like PubTables-1M and achieves significantly", "orig": "when applied on a bigger data set like PubTables-1M and achieves significantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 652.9, "r_x1": 480.59, "r_y1": 652.9, "r_x2": 480.59, "r_y2": 644.1, "r_x3": 134.76, "r_y3": 644.1, "coord_origin": "TOPLEFT" }, "text": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "orig": "improved scores. Finally, OTSL achieves faster inference due to fewer decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 664.85, "r_x1": 405.8, "r_y1": 664.85, "r_x2": 405.8, "r_y2": 656.06, "r_x3": 134.76, "r_y3": 656.06, "coord_origin": "TOPLEFT" }, "text": "steps which is a result of the reduced sequence representation.", "orig": "steps which is a result of the reduced sequence representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Additionally, the results show that OTSL has an advantage over HTML when applied on a bigger data set like PubTables-1M and achieves significantly improved scores. Finally, OTSL achieves faster inference due to fewer decoding steps which is a result of the reduced sequence representation." } ], "headers": [ { "label": "page_header", "id": 8, "page_no": 8, "cluster": { "id": 8, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.937, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 9, "page_no": 8, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 475.98, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.886, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 475.98, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 475.98, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9" } ] } }, { "page_no": 9, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 123.76, "r_x1": 173.09, "r_y1": 123.76, "r_x2": 173.09, "r_y2": 115.84, "r_x3": 134.76, "r_y3": 115.84, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.3, "r_y0": 123.97, "r_x1": 480.59, "r_y1": 123.97, "r_x2": 480.59, "r_y2": 115.9, "r_x3": 181.3, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 134.93, "r_x1": 480.59, "r_y1": 134.93, "r_x2": 480.59, "r_y2": 126.86, "r_x3": 134.76, "r_y3": 126.86, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 145.89, "r_x1": 305.96, "r_y1": 145.89, "r_x2": 305.96, "r_y2": 137.82, "r_x3": 134.76, "r_y3": 137.82, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.78, "r_y0": 174.63, "r_x1": 195.0, "r_y1": 174.63, "r_x2": 195.0, "r_y2": 166.56, "r_x3": 160.78, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52, "r_y0": 174.6, "r_x1": 254.04, "r_y1": 174.6, "r_x2": 254.04, "r_y2": 166.53, "r_x3": 215.52, "r_y3": 166.53, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.15, "r_x1": 323.99, "r_y1": 169.15, "r_x2": 323.99, "r_y2": 161.08, "r_x3": 300.4, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.35, "r_y0": 174.63, "r_x1": 414.75, "r_y1": 174.63, "r_x2": 414.75, "r_y2": 166.56, "r_x3": 370.35, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.74, "r_y0": 169.15, "r_x1": 463.11, "r_y1": 169.15, "r_x2": 463.11, "r_y2": 161.08, "r_x3": 426.74, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11, "r_y0": 180.11, "r_x1": 466.73, "r_y1": 180.11, "r_x2": 466.73, "r_y2": 172.04, "r_x3": 423.11, "r_y3": 172.04, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41, "r_y0": 182.1, "r_x1": 288.06, "r_y1": 182.1, "r_x2": 288.06, "r_y2": 174.03, "r_x3": 262.41, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.43, "r_y0": 182.1, "r_x1": 329.45, "r_y1": 182.1, "r_x2": 329.45, "r_y2": 174.03, "r_x3": 296.43, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03, "r_y0": 182.1, "r_x1": 354.76, "r_y1": 182.1, "r_x2": 354.76, "r_y2": 174.03, "r_x3": 345.03, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.54, "r_y0": 200.93, "r_x1": 201.24, "r_y1": 200.93, "r_x2": 201.24, "r_y2": 192.86, "r_x3": 154.54, "r_y3": 192.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 195.45, "r_x1": 247.13, "r_y1": 195.45, "r_x2": 247.13, "r_y2": 187.38, "r_x3": 222.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 195.45, "r_x1": 285.73, "r_y1": 195.45, "r_x2": 285.73, "r_y2": 187.38, "r_x3": 264.74, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 195.45, "r_x1": 323.43, "r_y1": 195.45, "r_x2": 323.43, "r_y2": 187.38, "r_x3": 302.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.45, "r_x1": 360.39, "r_y1": 195.45, "r_x2": 360.39, "r_y2": 187.38, "r_x3": 339.4, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.12, "r_y0": 195.24, "r_x1": 401.97, "r_y1": 195.24, "r_x2": 401.97, "r_y2": 187.32, "r_x3": 383.12, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 195.24, "r_x1": 454.35, "r_y1": 195.24, "r_x2": 454.35, "r_y2": 187.32, "r_x3": 435.49, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.67, "r_y1": 208.4, "r_x2": 248.67, "r_y2": 200.33, "r_x3": 220.9, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 208.4, "r_x1": 285.73, "r_y1": 208.4, "r_x2": 285.73, "r_y2": 200.33, "r_x3": 264.74, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 208.4, "r_x1": 323.43, "r_y1": 208.4, "r_x2": 323.43, "r_y2": 200.33, "r_x3": 302.44, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.39, "r_y1": 208.4, "r_x2": 360.39, "r_y2": 200.33, "r_x3": 339.4, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 208.4, "r_x1": 403.04, "r_y1": 208.4, "r_x2": 403.04, "r_y2": 200.33, "r_x3": 382.05, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 208.4, "r_x1": 453.11, "r_y1": 208.4, "r_x2": 453.11, "r_y2": 200.33, "r_x3": 436.73, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.95, "r_y0": 227.23, "r_x1": 199.83, "r_y1": 227.23, "r_x2": 199.83, "r_y2": 219.16, "r_x3": 155.95, "r_y3": 219.16, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 221.75, "r_x1": 247.13, "r_y1": 221.75, "r_x2": 247.13, "r_y2": 213.68, "r_x3": 222.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 221.75, "r_x1": 285.73, "r_y1": 221.75, "r_x2": 285.73, "r_y2": 213.68, "r_x3": 264.74, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 221.75, "r_x1": 323.43, "r_y1": 221.75, "r_x2": 323.43, "r_y2": 213.68, "r_x3": 302.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 221.55, "r_x1": 361.98, "r_y1": 221.55, "r_x2": 361.98, "r_y2": 213.62, "r_x3": 337.81, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 221.55, "r_x1": 404.62, "r_y1": 221.55, "r_x2": 404.62, "r_y2": 213.62, "r_x3": 380.46, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 221.55, "r_x1": 454.35, "r_y1": 221.55, "r_x2": 454.35, "r_y2": 213.62, "r_x3": 435.49, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.67, "r_y1": 234.7, "r_x2": 248.67, "r_y2": 226.63, "r_x3": 220.9, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 234.7, "r_x1": 285.73, "r_y1": 234.7, "r_x2": 285.73, "r_y2": 226.63, "r_x3": 264.74, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 234.7, "r_x1": 323.43, "r_y1": 234.7, "r_x2": 323.43, "r_y2": 226.63, "r_x3": 302.44, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.71, "r_y0": 234.7, "r_x1": 358.09, "r_y1": 234.7, "r_x2": 358.09, "r_y2": 226.63, "r_x3": 341.71, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 234.7, "r_x1": 403.04, "r_y1": 234.7, "r_x2": 403.04, "r_y2": 226.63, "r_x3": 382.05, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 234.7, "r_x1": 453.11, "r_y1": 234.7, "r_x2": 453.11, "r_y2": 226.63, "r_x3": 436.73, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.63, "r_y0": 253.53, "r_x1": 207.15, "r_y1": 253.53, "r_x2": 207.15, "r_y2": 245.46, "r_x3": 148.63, "r_y3": 245.46, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 248.05, "r_x1": 247.13, "r_y1": 248.05, "r_x2": 247.13, "r_y2": 239.98, "r_x3": 222.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 248.05, "r_x1": 285.73, "r_y1": 248.05, "r_x2": 285.73, "r_y2": 239.98, "r_x3": 264.74, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 248.05, "r_x1": 323.43, "r_y1": 248.05, "r_x2": 323.43, "r_y2": 239.98, "r_x3": 302.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 247.85, "r_x1": 361.98, "r_y1": 247.85, "r_x2": 361.98, "r_y2": 239.92, "r_x3": 337.81, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 247.85, "r_x1": 404.62, "r_y1": 247.85, "r_x2": 404.62, "r_y2": 239.92, "r_x3": 380.46, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 247.85, "r_x1": 454.35, "r_y1": 247.85, "r_x2": 454.35, "r_y2": 239.92, "r_x3": 435.49, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.67, "r_y1": 261.0, "r_x2": 248.67, "r_y2": 252.93, "r_x3": 220.9, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 261.0, "r_x1": 285.73, "r_y1": 261.0, "r_x2": 285.73, "r_y2": 252.93, "r_x3": 264.74, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 261.0, "r_x1": 323.43, "r_y1": 261.0, "r_x2": 323.43, "r_y2": 252.93, "r_x3": 302.44, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.39, "r_y1": 261.0, "r_x2": 360.39, "r_y2": 252.93, "r_x3": 339.4, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 261.0, "r_x1": 403.04, "r_y1": 261.0, "r_x2": 403.04, "r_y2": 252.93, "r_x3": 382.05, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 261.0, "r_x1": 453.11, "r_y1": 261.0, "r_x2": 453.11, "r_y2": 252.93, "r_x3": 436.73, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 297.72, "r_x1": 149.4, "r_y1": 297.72, "r_x2": 149.4, "r_y2": 288.91, "r_x3": 134.76, "r_y3": 288.91, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 297.72, "r_x1": 257.09, "r_y1": 297.72, "r_x2": 257.09, "r_y2": 288.91, "r_x3": 160.86, "r_y3": 288.91, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 318.66, "r_x1": 480.59, "r_y1": 318.66, "r_x2": 480.59, "r_y2": 309.86, "r_x3": 134.76, "r_y3": 309.86, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 330.61, "r_x1": 480.59, "r_y1": 330.61, "r_x2": 480.59, "r_y2": 321.82, "r_x3": 134.76, "r_y3": 321.82, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 342.57, "r_x1": 480.59, "r_y1": 342.57, "r_x2": 480.59, "r_y2": 333.77, "r_x3": 134.76, "r_y3": 333.77, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 354.52, "r_x1": 480.59, "r_y1": 354.52, "r_x2": 480.59, "r_y2": 345.73, "r_x3": 134.76, "r_y3": 345.73, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 366.48, "r_x1": 161.66, "r_y1": 366.48, "r_x2": 161.66, "r_y2": 357.68, "r_x3": 134.76, "r_y3": 357.68, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 405.52, "r_x1": 162.64, "r_y1": 405.52, "r_x2": 162.64, "r_y2": 397.59, "r_x3": 134.76, "r_y3": 397.59, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38, "r_y0": 405.72, "r_x1": 480.59, "r_y1": 405.72, "r_x2": 480.59, "r_y2": 397.65, "r_x3": 167.38, "r_y3": 397.65, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 416.68, "r_x1": 480.59, "r_y1": 416.68, "r_x2": 480.59, "r_y2": 408.61, "r_x3": 134.76, "r_y3": 408.61, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 427.64, "r_x1": 480.59, "r_y1": 427.64, "r_x2": 480.59, "r_y2": 419.57, "r_x3": 134.76, "r_y3": 419.57, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 438.6, "r_x1": 304.69, "r_y1": 438.6, "r_x2": 304.69, "r_y2": 430.53, "r_x3": 134.76, "r_y3": 430.53, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 518.95, "r_x1": 190.62, "r_y1": 518.95, "r_x2": 190.62, "r_y2": 516.23, "r_x3": 180.12, "r_y3": 516.23, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 522.85, "r_x1": 304.55, "r_y1": 522.85, "r_x2": 304.55, "r_y2": 520.13, "r_x3": 183.24, "r_y3": 520.13, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 526.75, "r_x1": 388.42, "r_y1": 526.75, "r_x2": 388.42, "r_y2": 524.03, "r_x3": 183.24, "r_y3": 524.03, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 530.65, "r_x1": 388.42, "r_y1": 530.65, "r_x2": 388.42, "r_y2": 527.93, "r_x3": 183.24, "r_y3": 527.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 534.55, "r_x1": 388.42, "r_y1": 534.55, "r_x2": 388.42, "r_y2": 531.83, "r_x3": 183.24, "r_y3": 531.83, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 538.44, "r_x1": 388.42, "r_y1": 538.44, "r_x2": 388.42, "r_y2": 535.73, "r_x3": 183.24, "r_y3": 535.73, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 542.34, "r_x1": 388.42, "r_y1": 542.34, "r_x2": 388.42, "r_y2": 539.63, "r_x3": 183.24, "r_y3": 539.63, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 546.24, "r_x1": 388.42, "r_y1": 546.24, "r_x2": 388.42, "r_y2": 543.53, "r_x3": 183.24, "r_y3": 543.53, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 550.14, "r_x1": 388.42, "r_y1": 550.14, "r_x2": 388.42, "r_y2": 547.42, "r_x3": 183.24, "r_y3": 547.42, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 554.04, "r_x1": 388.42, "r_y1": 554.04, "r_x2": 388.42, "r_y2": 551.32, "r_x3": 183.24, "r_y3": 551.32, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 557.94, "r_x1": 191.87, "r_y1": 557.94, "r_x2": 191.87, "r_y2": 555.22, "r_x3": 180.12, "r_y3": 555.22, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 521.02, "r_x1": 408.82, "r_y1": 521.02, "r_x2": 408.82, "r_y2": 518.3, "r_x3": 407.38, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 521.02, "r_x1": 450.49, "r_y1": 521.02, "r_x2": 450.49, "r_y2": 518.3, "r_x3": 410.26, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 524.92, "r_x1": 408.82, "r_y1": 524.92, "r_x2": 408.82, "r_y2": 522.2, "r_x3": 407.38, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 524.92, "r_x1": 450.49, "r_y1": 524.92, "r_x2": 450.49, "r_y2": 522.2, "r_x3": 410.26, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 528.81, "r_x1": 408.82, "r_y1": 528.81, "r_x2": 408.82, "r_y2": 526.1, "r_x3": 407.38, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 528.81, "r_x1": 450.49, "r_y1": 528.81, "r_x2": 450.49, "r_y2": 526.1, "r_x3": 410.26, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 532.71, "r_x1": 408.82, "r_y1": 532.71, "r_x2": 408.82, "r_y2": 530.0, "r_x3": 407.38, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 532.71, "r_x1": 450.49, "r_y1": 532.71, "r_x2": 450.49, "r_y2": 530.0, "r_x3": 410.26, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 536.61, "r_x1": 408.82, "r_y1": 536.61, "r_x2": 408.82, "r_y2": 533.9, "r_x3": 407.38, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 536.61, "r_x1": 450.49, "r_y1": 536.61, "r_x2": 450.49, "r_y2": 533.9, "r_x3": 410.26, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 540.51, "r_x1": 408.82, "r_y1": 540.51, "r_x2": 408.82, "r_y2": 537.79, "r_x3": 407.38, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 540.51, "r_x1": 450.49, "r_y1": 540.51, "r_x2": 450.49, "r_y2": 537.79, "r_x3": 410.26, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 544.41, "r_x1": 408.82, "r_y1": 544.41, "r_x2": 408.82, "r_y2": 541.69, "r_x3": 407.38, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 544.41, "r_x1": 450.49, "r_y1": 544.41, "r_x2": 450.49, "r_y2": 541.69, "r_x3": 410.26, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 548.31, "r_x1": 408.82, "r_y1": 548.31, "r_x2": 408.82, "r_y2": 545.59, "r_x3": 407.38, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 548.31, "r_x1": 450.49, "r_y1": 548.31, "r_x2": 450.49, "r_y2": 545.59, "r_x3": 410.26, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 552.21, "r_x1": 408.82, "r_y1": 552.21, "r_x2": 408.82, "r_y2": 549.49, "r_x3": 407.38, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 552.21, "r_x1": 450.49, "r_y1": 552.21, "r_x2": 450.49, "r_y2": 549.49, "r_x3": 410.26, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.53, "r_y0": 515.31, "r_x1": 181.85, "r_y1": 515.31, "r_x2": 181.85, "r_y2": 509.46, "r_x3": 164.53, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58, "r_y0": 515.31, "r_x1": 186.4, "r_y1": 515.31, "r_x2": 186.4, "r_y2": 509.46, "r_x3": 183.58, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.21, "r_y0": 515.31, "r_x1": 208.9, "r_y1": 515.31, "r_x2": 208.9, "r_y2": 509.46, "r_x3": 189.21, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63, "r_y0": 515.31, "r_x1": 221.04, "r_y1": 515.31, "r_x2": 221.04, "r_y2": 509.46, "r_x3": 210.63, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.46, "r_x1": 406.84, "r_y1": 515.46, "r_x2": 406.84, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.57, "r_y0": 515.46, "r_x1": 411.38, "r_y1": 515.46, "r_x2": 411.38, "r_y2": 509.6, "r_x3": 408.57, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.46, "r_x1": 433.89, "r_y1": 515.46, "r_x2": 433.89, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.62, "r_y0": 515.46, "r_x1": 446.03, "r_y1": 515.46, "r_x2": 446.03, "r_y2": 509.6, "r_x3": 435.62, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19, "r_y0": 526.39, "r_x1": 172.82, "r_y1": 526.39, "r_x2": 172.82, "r_y2": 519.07, "r_x3": 167.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.34, "r_y0": 455.94, "r_x1": 192.97, "r_y1": 455.94, "r_x2": 192.97, "r_y2": 448.62, "r_x3": 187.34, "r_y3": 448.62, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.39, "r_y0": 573.32, "r_x1": 173.02, "r_y1": 573.32, "r_x2": 173.02, "r_y2": 566.01, "r_x3": 167.39, "r_y3": 566.01, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.46, "r_y0": 629.09, "r_x1": 253.66, "r_y1": 629.09, "r_x2": 253.66, "r_y2": 621.78, "r_x3": 248.46, "r_y3": 621.78, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.51, "r_x1": 401.53, "r_y1": 526.51, "r_x2": 401.53, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.63, "r_y0": 597.27, "r_x1": 177.48, "r_y1": 597.27, "r_x2": 177.48, "r_y2": 580.29, "r_x3": 171.63, "r_y3": 580.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.06, "r_y0": 649.92, "r_x1": 256.91, "r_y1": 649.92, "r_x2": 256.91, "r_y2": 633.63, "r_x3": 251.06, "r_y3": 633.63, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 607.31, "r_x1": 427.04, "r_y1": 607.31, "r_x2": 427.04, "r_y2": 601.46, "r_x3": 372.15, "r_y3": 601.46, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 613.75, "r_x1": 430.07, "r_y1": 613.75, "r_x2": 430.07, "r_y2": 607.9, "r_x3": 372.15, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 648.72, "r_x1": 231.08, "r_y1": 648.72, "r_x2": 231.08, "r_y2": 642.87, "r_x3": 176.88, "r_y3": 642.87, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 655.17, "r_x1": 230.99, "r_y1": 655.17, "r_x2": 230.99, "r_y2": 649.31, "r_x3": 176.88, "r_y3": 649.31, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 661.61, "r_x1": 203.93, "r_y1": 661.61, "r_x2": 203.93, "r_y2": 655.76, "r_x3": 176.88, "r_y3": 655.76, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.56, "r_x3": 215.93, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.06, "r_y0": 569.16, "r_x1": 231.72, "r_y1": 569.16, "r_x2": 231.72, "r_y2": 557.56, "r_x3": 229.06, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.63, "r_y0": 439.72, "r_x1": 344.82, "r_y1": 439.72, "r_x2": 344.82, "r_y2": 430.2, "r_x3": 342.63, "r_y3": 430.2, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.21, "r_y0": 451.2, "r_x1": 263.57, "r_y1": 451.2, "r_x2": 263.57, "r_y2": 448.46, "r_x3": 261.21, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33, "r_y0": 451.2, "r_x1": 313.64, "r_y1": 451.2, "r_x2": 313.64, "r_y2": 448.46, "r_x3": 312.33, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41, "r_y0": 451.2, "r_x1": 380.06, "r_y1": 451.2, "r_x2": 380.06, "r_y2": 448.46, "r_x3": 377.41, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 456.08, "r_x1": 205.82, "r_y1": 456.08, "r_x2": 205.82, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.21, "r_y0": 456.08, "r_x1": 229.77, "r_y1": 456.08, "r_x2": 229.77, "r_y2": 453.34, "r_x3": 222.21, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.27, "r_y0": 456.08, "r_x1": 250.83, "r_y1": 456.08, "r_x2": 250.83, "r_y2": 453.34, "r_x3": 243.27, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.08, "r_x1": 271.85, "r_y1": 456.08, "r_x2": 271.85, "r_y2": 453.34, "r_x3": 264.3, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.32, "r_y0": 456.08, "r_x1": 292.88, "r_y1": 456.08, "r_x2": 292.88, "r_y2": 453.34, "r_x3": 285.32, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.38, "r_y0": 456.08, "r_x1": 311.77, "r_y1": 456.08, "r_x2": 311.77, "r_y2": 453.34, "r_x3": 306.38, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.42, "r_y0": 456.08, "r_x1": 325.58, "r_y1": 456.08, "r_x2": 325.58, "r_y2": 453.34, "r_x3": 323.42, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.46, "r_y0": 456.08, "r_x1": 336.62, "r_y1": 456.08, "r_x2": 336.62, "r_y2": 453.34, "r_x3": 334.46, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.53, "r_y0": 456.08, "r_x1": 347.69, "r_y1": 456.08, "r_x2": 347.69, "r_y2": 453.34, "r_x3": 345.53, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.57, "r_y0": 456.08, "r_x1": 358.73, "r_y1": 456.08, "r_x2": 358.73, "r_y2": 453.34, "r_x3": 356.57, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.64, "r_y0": 456.08, "r_x1": 371.97, "r_y1": 456.08, "r_x2": 371.97, "r_y2": 453.34, "r_x3": 367.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.67, "r_y0": 456.08, "r_x1": 387.01, "r_y1": 456.08, "r_x2": 387.01, "r_y2": 453.34, "r_x3": 382.67, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.74, "r_y0": 456.08, "r_x1": 402.07, "r_y1": 456.08, "r_x2": 402.07, "r_y2": 453.34, "r_x3": 397.74, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 457.8, "r_x1": 414.93, "r_y1": 457.8, "r_x2": 414.93, "r_y2": 447.99, "r_x3": 412.79, "r_y3": 447.99, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.96, "r_y0": 456.08, "r_x1": 422.52, "r_y1": 456.08, "r_x2": 422.52, "r_y2": 453.34, "r_x3": 414.96, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.58, "r_y1": 466.66, "r_x2": 204.58, "r_y2": 463.92, "r_x3": 200.64, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.92, "r_x3": 367.63, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 466.66, "r_x1": 384.62, "r_y1": 466.66, "r_x2": 384.62, "r_y2": 463.92, "r_x3": 382.66, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 466.66, "r_x1": 399.68, "r_y1": 466.66, "r_x2": 399.68, "r_y2": 463.92, "r_x3": 397.73, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.54, "r_x1": 206.52, "r_y1": 471.54, "r_x2": 206.52, "r_y2": 468.8, "r_x3": 200.64, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 471.54, "r_x1": 266.26, "r_y1": 471.54, "r_x2": 266.26, "r_y2": 468.8, "r_x3": 264.29, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37, "r_y0": 471.54, "r_x1": 308.34, "r_y1": 471.54, "r_x2": 308.34, "r_y2": 468.8, "r_x3": 306.37, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52, "r_y0": 471.54, "r_x1": 347.48, "r_y1": 471.54, "r_x2": 347.48, "r_y2": 468.8, "r_x3": 345.52, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56, "r_y0": 471.54, "r_x1": 358.52, "r_y1": 471.54, "r_x2": 358.52, "r_y2": 468.8, "r_x3": 356.56, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 471.54, "r_x1": 369.59, "r_y1": 471.54, "r_x2": 369.59, "r_y2": 468.8, "r_x3": 367.63, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 471.54, "r_x1": 384.63, "r_y1": 471.54, "r_x2": 384.63, "r_y2": 468.8, "r_x3": 382.66, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.42, "r_x1": 206.52, "r_y1": 476.42, "r_x2": 206.52, "r_y2": 473.68, "r_x3": 200.64, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 476.42, "r_x1": 266.26, "r_y1": 476.42, "r_x2": 266.26, "r_y2": 473.68, "r_x3": 264.29, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.27, "r_x1": 206.52, "r_y1": 481.27, "r_x2": 206.52, "r_y2": 478.53, "r_x3": 200.64, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26, "r_y0": 481.27, "r_x1": 245.23, "r_y1": 481.27, "r_x2": 245.23, "r_y2": 478.53, "r_x3": 243.26, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 481.27, "r_x1": 266.26, "r_y1": 481.27, "r_x2": 266.26, "r_y2": 478.53, "r_x3": 264.29, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.27, "r_x1": 325.37, "r_y1": 481.27, "r_x2": 325.37, "r_y2": 478.53, "r_x3": 323.4, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 481.27, "r_x1": 399.69, "r_y1": 481.27, "r_x2": 399.69, "r_y2": 478.53, "r_x3": 397.73, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.15, "r_x1": 206.52, "r_y1": 486.15, "r_x2": 206.52, "r_y2": 483.41, "r_x3": 200.64, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 486.15, "r_x1": 384.62, "r_y1": 486.15, "r_x2": 384.62, "r_y2": 483.41, "r_x3": 382.66, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 486.15, "r_x1": 401.65, "r_y1": 486.15, "r_x2": 401.65, "r_y2": 483.41, "r_x3": 397.73, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 486.15, "r_x1": 414.74, "r_y1": 486.15, "r_x2": 414.74, "r_y2": 483.41, "r_x3": 412.79, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 491.03, "r_x1": 207.14, "r_y1": 491.03, "r_x2": 207.14, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 491.03, "r_x1": 369.78, "r_y1": 491.03, "r_x2": 369.78, "r_y2": 488.29, "r_x3": 367.63, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 491.03, "r_x1": 384.82, "r_y1": 491.03, "r_x2": 384.82, "r_y2": 488.29, "r_x3": 382.66, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 491.03, "r_x1": 402.05, "r_y1": 491.03, "r_x2": 402.05, "r_y2": 488.29, "r_x3": 397.73, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 495.9, "r_x1": 208.49, "r_y1": 495.9, "r_x2": 208.49, "r_y2": 493.17, "r_x3": 200.64, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 495.9, "r_x1": 266.26, "r_y1": 495.9, "r_x2": 266.26, "r_y2": 493.17, "r_x3": 264.29, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.91, "r_y0": 675.35, "r_x1": 230.1, "r_y1": 675.35, "r_x2": 230.1, "r_y2": 665.83, "r_x3": 227.91, "r_y3": 665.83, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.58, "r_y0": 693.43, "r_x1": 302.73, "r_y1": 693.43, "r_x2": 302.73, "r_y2": 683.62, "r_x3": 300.58, "r_y3": 683.62, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 143.98, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.831, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 167.82, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.837, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "caption", "bbox": { "l": 134.76, "t": 115.84, "r": 480.59, "b": 145.89, "coord_origin": "TOPLEFT" }, "confidence": 0.951, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 123.76, "r_x1": 173.09, "r_y1": 123.76, "r_x2": 173.09, "r_y2": 115.84, "r_x3": 134.76, "r_y3": 115.84, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.3, "r_y0": 123.97, "r_x1": 480.59, "r_y1": 123.97, "r_x2": 480.59, "r_y2": 115.9, "r_x3": 181.3, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 134.93, "r_x1": 480.59, "r_y1": 134.93, "r_x2": 480.59, "r_y2": 126.86, "r_x3": 134.76, "r_y3": 126.86, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 145.89, "r_x1": 305.96, "r_y1": 145.89, "r_x2": 305.96, "r_y2": 137.82, "r_x3": 134.76, "r_y3": 137.82, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "table", "bbox": { "l": 143.64, "t": 156.35, "r": 470.85, "b": 263.26, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.78, "r_y0": 174.63, "r_x1": 195.0, "r_y1": 174.63, "r_x2": 195.0, "r_y2": 166.56, "r_x3": 160.78, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52, "r_y0": 174.6, "r_x1": 254.04, "r_y1": 174.6, "r_x2": 254.04, "r_y2": 166.53, "r_x3": 215.52, "r_y3": 166.53, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.15, "r_x1": 323.99, "r_y1": 169.15, "r_x2": 323.99, "r_y2": 161.08, "r_x3": 300.4, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.35, "r_y0": 174.63, "r_x1": 414.75, "r_y1": 174.63, "r_x2": 414.75, "r_y2": 166.56, "r_x3": 370.35, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.74, "r_y0": 169.15, "r_x1": 463.11, "r_y1": 169.15, "r_x2": 463.11, "r_y2": 161.08, "r_x3": 426.74, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11, "r_y0": 180.11, "r_x1": 466.73, "r_y1": 180.11, "r_x2": 466.73, "r_y2": 172.04, "r_x3": 423.11, "r_y3": 172.04, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41, "r_y0": 182.1, "r_x1": 288.06, "r_y1": 182.1, "r_x2": 288.06, "r_y2": 174.03, "r_x3": 262.41, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.43, "r_y0": 182.1, "r_x1": 329.45, "r_y1": 182.1, "r_x2": 329.45, "r_y2": 174.03, "r_x3": 296.43, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03, "r_y0": 182.1, "r_x1": 354.76, "r_y1": 182.1, "r_x2": 354.76, "r_y2": 174.03, "r_x3": 345.03, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.54, "r_y0": 200.93, "r_x1": 201.24, "r_y1": 200.93, "r_x2": 201.24, "r_y2": 192.86, "r_x3": 154.54, "r_y3": 192.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 195.45, "r_x1": 247.13, "r_y1": 195.45, "r_x2": 247.13, "r_y2": 187.38, "r_x3": 222.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 195.45, "r_x1": 285.73, "r_y1": 195.45, "r_x2": 285.73, "r_y2": 187.38, "r_x3": 264.74, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 195.45, "r_x1": 323.43, "r_y1": 195.45, "r_x2": 323.43, "r_y2": 187.38, "r_x3": 302.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.45, "r_x1": 360.39, "r_y1": 195.45, "r_x2": 360.39, "r_y2": 187.38, "r_x3": 339.4, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.12, "r_y0": 195.24, "r_x1": 401.97, "r_y1": 195.24, "r_x2": 401.97, "r_y2": 187.32, "r_x3": 383.12, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 195.24, "r_x1": 454.35, "r_y1": 195.24, "r_x2": 454.35, "r_y2": 187.32, "r_x3": 435.49, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.67, "r_y1": 208.4, "r_x2": 248.67, "r_y2": 200.33, "r_x3": 220.9, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 208.4, "r_x1": 285.73, "r_y1": 208.4, "r_x2": 285.73, "r_y2": 200.33, "r_x3": 264.74, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 208.4, "r_x1": 323.43, "r_y1": 208.4, "r_x2": 323.43, "r_y2": 200.33, "r_x3": 302.44, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.39, "r_y1": 208.4, "r_x2": 360.39, "r_y2": 200.33, "r_x3": 339.4, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 208.4, "r_x1": 403.04, "r_y1": 208.4, "r_x2": 403.04, "r_y2": 200.33, "r_x3": 382.05, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 208.4, "r_x1": 453.11, "r_y1": 208.4, "r_x2": 453.11, "r_y2": 200.33, "r_x3": 436.73, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.95, "r_y0": 227.23, "r_x1": 199.83, "r_y1": 227.23, "r_x2": 199.83, "r_y2": 219.16, "r_x3": 155.95, "r_y3": 219.16, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 221.75, "r_x1": 247.13, "r_y1": 221.75, "r_x2": 247.13, "r_y2": 213.68, "r_x3": 222.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 221.75, "r_x1": 285.73, "r_y1": 221.75, "r_x2": 285.73, "r_y2": 213.68, "r_x3": 264.74, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 221.75, "r_x1": 323.43, "r_y1": 221.75, "r_x2": 323.43, "r_y2": 213.68, "r_x3": 302.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 221.55, "r_x1": 361.98, "r_y1": 221.55, "r_x2": 361.98, "r_y2": 213.62, "r_x3": 337.81, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 221.55, "r_x1": 404.62, "r_y1": 221.55, "r_x2": 404.62, "r_y2": 213.62, "r_x3": 380.46, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 221.55, "r_x1": 454.35, "r_y1": 221.55, "r_x2": 454.35, "r_y2": 213.62, "r_x3": 435.49, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.67, "r_y1": 234.7, "r_x2": 248.67, "r_y2": 226.63, "r_x3": 220.9, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 234.7, "r_x1": 285.73, "r_y1": 234.7, "r_x2": 285.73, "r_y2": 226.63, "r_x3": 264.74, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 234.7, "r_x1": 323.43, "r_y1": 234.7, "r_x2": 323.43, "r_y2": 226.63, "r_x3": 302.44, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.71, "r_y0": 234.7, "r_x1": 358.09, "r_y1": 234.7, "r_x2": 358.09, "r_y2": 226.63, "r_x3": 341.71, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 234.7, "r_x1": 403.04, "r_y1": 234.7, "r_x2": 403.04, "r_y2": 226.63, "r_x3": 382.05, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 234.7, "r_x1": 453.11, "r_y1": 234.7, "r_x2": 453.11, "r_y2": 226.63, "r_x3": 436.73, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.63, "r_y0": 253.53, "r_x1": 207.15, "r_y1": 253.53, "r_x2": 207.15, "r_y2": 245.46, "r_x3": 148.63, "r_y3": 245.46, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 248.05, "r_x1": 247.13, "r_y1": 248.05, "r_x2": 247.13, "r_y2": 239.98, "r_x3": 222.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 248.05, "r_x1": 285.73, "r_y1": 248.05, "r_x2": 285.73, "r_y2": 239.98, "r_x3": 264.74, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 248.05, "r_x1": 323.43, "r_y1": 248.05, "r_x2": 323.43, "r_y2": 239.98, "r_x3": 302.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 247.85, "r_x1": 361.98, "r_y1": 247.85, "r_x2": 361.98, "r_y2": 239.92, "r_x3": 337.81, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 247.85, "r_x1": 404.62, "r_y1": 247.85, "r_x2": 404.62, "r_y2": 239.92, "r_x3": 380.46, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 247.85, "r_x1": 454.35, "r_y1": 247.85, "r_x2": 454.35, "r_y2": 239.92, "r_x3": 435.49, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.67, "r_y1": 261.0, "r_x2": 248.67, "r_y2": 252.93, "r_x3": 220.9, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 261.0, "r_x1": 285.73, "r_y1": 261.0, "r_x2": 285.73, "r_y2": 252.93, "r_x3": 264.74, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 261.0, "r_x1": 323.43, "r_y1": 261.0, "r_x2": 323.43, "r_y2": 252.93, "r_x3": 302.44, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.39, "r_y1": 261.0, "r_x2": 360.39, "r_y2": 252.93, "r_x3": 339.4, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 261.0, "r_x1": 403.04, "r_y1": 261.0, "r_x2": 403.04, "r_y2": 252.93, "r_x3": 382.05, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 261.0, "r_x1": 453.11, "r_y1": 261.0, "r_x2": 453.11, "r_y2": 252.93, "r_x3": 436.73, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.78, "t": 166.56, "r": 195.0, "b": 174.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.78, "r_y0": 174.63, "r_x1": 195.0, "r_y1": 174.63, "r_x2": 195.0, "r_y2": 166.56, "r_x3": 160.78, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.52, "t": 166.53, "r": 254.04, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52, "r_y0": 174.6, "r_x1": 254.04, "r_y1": 174.6, "r_x2": 254.04, "r_y2": 166.53, "r_x3": 215.52, "r_y3": 166.53, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.4, "t": 161.08, "r": 323.99, "b": 169.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.15, "r_x1": 323.99, "r_y1": 169.15, "r_x2": 323.99, "r_y2": 161.08, "r_x3": 300.4, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.35, "t": 166.56, "r": 414.75, "b": 174.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.35, "r_y0": 174.63, "r_x1": 414.75, "r_y1": 174.63, "r_x2": 414.75, "r_y2": 166.56, "r_x3": 370.35, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.74, "t": 161.08, "r": 463.11, "b": 169.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.74, "r_y0": 169.15, "r_x1": 463.11, "r_y1": 169.15, "r_x2": 463.11, "r_y2": 161.08, "r_x3": 426.74, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.11, "t": 172.04, "r": 466.73, "b": 180.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11, "r_y0": 180.11, "r_x1": 466.73, "r_y1": 180.11, "r_x2": 466.73, "r_y2": 172.04, "r_x3": 423.11, "r_y3": 172.04, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.41, "t": 174.03, "r": 288.06, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41, "r_y0": 182.1, "r_x1": 288.06, "r_y1": 182.1, "r_x2": 288.06, "r_y2": 174.03, "r_x3": 262.41, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.43, "t": 174.03, "r": 329.45, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.43, "r_y0": 182.1, "r_x1": 329.45, "r_y1": 182.1, "r_x2": 329.45, "r_y2": 174.03, "r_x3": 296.43, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.03, "t": 174.03, "r": 354.76, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03, "r_y0": 182.1, "r_x1": 354.76, "r_y1": 182.1, "r_x2": 354.76, "r_y2": 174.03, "r_x3": 345.03, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.54, "t": 192.86, "r": 201.24, "b": 200.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.54, "r_y0": 200.93, "r_x1": 201.24, "r_y1": 200.93, "r_x2": 201.24, "r_y2": 192.86, "r_x3": 154.54, "r_y3": 192.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.44, "t": 187.38, "r": 247.13, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 195.45, "r_x1": 247.13, "r_y1": 195.45, "r_x2": 247.13, "r_y2": 187.38, "r_x3": 222.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.74, "t": 187.38, "r": 285.73, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 195.45, "r_x1": 285.73, "r_y1": 195.45, "r_x2": 285.73, "r_y2": 187.38, "r_x3": 264.74, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.44, "t": 187.38, "r": 323.43, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 195.45, "r_x1": 323.43, "r_y1": 195.45, "r_x2": 323.43, "r_y2": 187.38, "r_x3": 302.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.4, "t": 187.38, "r": 360.39, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.45, "r_x1": 360.39, "r_y1": 195.45, "r_x2": 360.39, "r_y2": 187.38, "r_x3": 339.4, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.12, "t": 187.32, "r": 401.97, "b": 195.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.12, "r_y0": 195.24, "r_x1": 401.97, "r_y1": 195.24, "r_x2": 401.97, "r_y2": 187.32, "r_x3": 383.12, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.49, "t": 187.32, "r": 454.35, "b": 195.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 195.24, "r_x1": 454.35, "r_y1": 195.24, "r_x2": 454.35, "r_y2": 187.32, "r_x3": 435.49, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.9, "t": 200.33, "r": 248.67, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.67, "r_y1": 208.4, "r_x2": 248.67, "r_y2": 200.33, "r_x3": 220.9, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.74, "t": 200.33, "r": 285.73, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 208.4, "r_x1": 285.73, "r_y1": 208.4, "r_x2": 285.73, "r_y2": 200.33, "r_x3": 264.74, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.44, "t": 200.33, "r": 323.43, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 208.4, "r_x1": 323.43, "r_y1": 208.4, "r_x2": 323.43, "r_y2": 200.33, "r_x3": 302.44, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.4, "t": 200.33, "r": 360.39, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.39, "r_y1": 208.4, "r_x2": 360.39, "r_y2": 200.33, "r_x3": 339.4, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.05, "t": 200.33, "r": 403.04, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 208.4, "r_x1": 403.04, "r_y1": 208.4, "r_x2": 403.04, "r_y2": 200.33, "r_x3": 382.05, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.73, "t": 200.33, "r": 453.11, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 208.4, "r_x1": 453.11, "r_y1": 208.4, "r_x2": 453.11, "r_y2": 200.33, "r_x3": 436.73, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.95, "t": 219.16, "r": 199.83, "b": 227.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.95, "r_y0": 227.23, "r_x1": 199.83, "r_y1": 227.23, "r_x2": 199.83, "r_y2": 219.16, "r_x3": 155.95, "r_y3": 219.16, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.44, "t": 213.68, "r": 247.13, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 221.75, "r_x1": 247.13, "r_y1": 221.75, "r_x2": 247.13, "r_y2": 213.68, "r_x3": 222.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.74, "t": 213.68, "r": 285.73, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 221.75, "r_x1": 285.73, "r_y1": 221.75, "r_x2": 285.73, "r_y2": 213.68, "r_x3": 264.74, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.44, "t": 213.68, "r": 323.43, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 221.75, "r_x1": 323.43, "r_y1": 221.75, "r_x2": 323.43, "r_y2": 213.68, "r_x3": 302.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.81, "t": 213.62, "r": 361.98, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 221.55, "r_x1": 361.98, "r_y1": 221.55, "r_x2": 361.98, "r_y2": 213.62, "r_x3": 337.81, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.46, "t": 213.62, "r": 404.62, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 221.55, "r_x1": 404.62, "r_y1": 221.55, "r_x2": 404.62, "r_y2": 213.62, "r_x3": 380.46, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.49, "t": 213.62, "r": 454.35, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 221.55, "r_x1": 454.35, "r_y1": 221.55, "r_x2": 454.35, "r_y2": 213.62, "r_x3": 435.49, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.9, "t": 226.63, "r": 248.67, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.67, "r_y1": 234.7, "r_x2": 248.67, "r_y2": 226.63, "r_x3": 220.9, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.74, "t": 226.63, "r": 285.73, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 234.7, "r_x1": 285.73, "r_y1": 234.7, "r_x2": 285.73, "r_y2": 226.63, "r_x3": 264.74, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.44, "t": 226.63, "r": 323.43, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 234.7, "r_x1": 323.43, "r_y1": 234.7, "r_x2": 323.43, "r_y2": 226.63, "r_x3": 302.44, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.71, "t": 226.63, "r": 358.09, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.71, "r_y0": 234.7, "r_x1": 358.09, "r_y1": 234.7, "r_x2": 358.09, "r_y2": 226.63, "r_x3": 341.71, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.05, "t": 226.63, "r": 403.04, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 234.7, "r_x1": 403.04, "r_y1": 234.7, "r_x2": 403.04, "r_y2": 226.63, "r_x3": 382.05, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.73, "t": 226.63, "r": 453.11, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 234.7, "r_x1": 453.11, "r_y1": 234.7, "r_x2": 453.11, "r_y2": 226.63, "r_x3": 436.73, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.63, "t": 245.46, "r": 207.15, "b": 253.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.63, "r_y0": 253.53, "r_x1": 207.15, "r_y1": 253.53, "r_x2": 207.15, "r_y2": 245.46, "r_x3": 148.63, "r_y3": 245.46, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.44, "t": 239.98, "r": 247.13, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 248.05, "r_x1": 247.13, "r_y1": 248.05, "r_x2": 247.13, "r_y2": 239.98, "r_x3": 222.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.74, "t": 239.98, "r": 285.73, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 248.05, "r_x1": 285.73, "r_y1": 248.05, "r_x2": 285.73, "r_y2": 239.98, "r_x3": 264.74, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.44, "t": 239.98, "r": 323.43, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 248.05, "r_x1": 323.43, "r_y1": 248.05, "r_x2": 323.43, "r_y2": 239.98, "r_x3": 302.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.81, "t": 239.92, "r": 361.98, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 247.85, "r_x1": 361.98, "r_y1": 247.85, "r_x2": 361.98, "r_y2": 239.92, "r_x3": 337.81, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.46, "t": 239.92, "r": 404.62, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 247.85, "r_x1": 404.62, "r_y1": 247.85, "r_x2": 404.62, "r_y2": 239.92, "r_x3": 380.46, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.49, "t": 239.92, "r": 454.35, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 247.85, "r_x1": 454.35, "r_y1": 247.85, "r_x2": 454.35, "r_y2": 239.92, "r_x3": 435.49, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.9, "t": 252.93, "r": 248.67, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.67, "r_y1": 261.0, "r_x2": 248.67, "r_y2": 252.93, "r_x3": 220.9, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.74, "t": 252.93, "r": 285.73, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 261.0, "r_x1": 285.73, "r_y1": 261.0, "r_x2": 285.73, "r_y2": 252.93, "r_x3": 264.74, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.44, "t": 252.93, "r": 323.43, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 261.0, "r_x1": 323.43, "r_y1": 261.0, "r_x2": 323.43, "r_y2": 252.93, "r_x3": 302.44, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.4, "t": 252.93, "r": 360.39, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.39, "r_y1": 261.0, "r_x2": 360.39, "r_y2": 252.93, "r_x3": 339.4, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.05, "t": 252.93, "r": 403.04, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 261.0, "r_x1": 403.04, "r_y1": 261.0, "r_x2": 403.04, "r_y2": 252.93, "r_x3": 382.05, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.73, "t": 252.93, "r": 453.11, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 261.0, "r_x1": 453.11, "r_y1": 261.0, "r_x2": 453.11, "r_y2": 252.93, "r_x3": 436.73, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 3, "label": "section_header", "bbox": { "l": 134.76, "t": 288.91, "r": 257.09, "b": 297.72, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 297.72, "r_x1": 149.4, "r_y1": 297.72, "r_x2": 149.4, "r_y2": 288.91, "r_x3": 134.76, "r_y3": 288.91, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 297.72, "r_x1": 257.09, "r_y1": 297.72, "r_x2": 257.09, "r_y2": 288.91, "r_x3": 160.86, "r_y3": 288.91, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 309.86, "r": 480.59, "b": 366.48, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 318.66, "r_x1": 480.59, "r_y1": 318.66, "r_x2": 480.59, "r_y2": 309.86, "r_x3": 134.76, "r_y3": 309.86, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 330.61, "r_x1": 480.59, "r_y1": 330.61, "r_x2": 480.59, "r_y2": 321.82, "r_x3": 134.76, "r_y3": 321.82, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 342.57, "r_x1": 480.59, "r_y1": 342.57, "r_x2": 480.59, "r_y2": 333.77, "r_x3": 134.76, "r_y3": 333.77, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 354.52, "r_x1": 480.59, "r_y1": 354.52, "r_x2": 480.59, "r_y2": 345.73, "r_x3": 134.76, "r_y3": 345.73, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 366.48, "r_x1": 161.66, "r_y1": 366.48, "r_x2": 161.66, "r_y2": 357.68, "r_x3": 134.76, "r_y3": 357.68, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "caption", "bbox": { "l": 134.76, "t": 397.59, "r": 480.59, "b": 439.72, "coord_origin": "TOPLEFT" }, "confidence": 0.948, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 405.52, "r_x1": 162.64, "r_y1": 405.52, "r_x2": 162.64, "r_y2": 397.59, "r_x3": 134.76, "r_y3": 397.59, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38, "r_y0": 405.72, "r_x1": 480.59, "r_y1": 405.72, "r_x2": 480.59, "r_y2": 397.65, "r_x3": 167.38, "r_y3": 397.65, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 416.68, "r_x1": 480.59, "r_y1": 416.68, "r_x2": 480.59, "r_y2": 408.61, "r_x3": 134.76, "r_y3": 408.61, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 427.64, "r_x1": 480.59, "r_y1": 427.64, "r_x2": 480.59, "r_y2": 419.57, "r_x3": 134.76, "r_y3": 419.57, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 438.6, "r_x1": 304.69, "r_y1": 438.6, "r_x2": 304.69, "r_y2": 430.53, "r_x3": 134.76, "r_y3": 430.53, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.63, "r_y0": 439.72, "r_x1": 344.82, "r_y1": 439.72, "r_x2": 344.82, "r_y2": 430.2, "r_x3": 342.63, "r_y3": 430.2, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "picture", "bbox": { "l": 162.67, "t": 444.62, "r": 451.7, "b": 663.21, "coord_origin": "TOPLEFT" }, "confidence": 0.974, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 518.95, "r_x1": 190.62, "r_y1": 518.95, "r_x2": 190.62, "r_y2": 516.23, "r_x3": 180.12, "r_y3": 516.23, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 522.85, "r_x1": 304.55, "r_y1": 522.85, "r_x2": 304.55, "r_y2": 520.13, "r_x3": 183.24, "r_y3": 520.13, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 526.75, "r_x1": 388.42, "r_y1": 526.75, "r_x2": 388.42, "r_y2": 524.03, "r_x3": 183.24, "r_y3": 524.03, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 530.65, "r_x1": 388.42, "r_y1": 530.65, "r_x2": 388.42, "r_y2": 527.93, "r_x3": 183.24, "r_y3": 527.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 534.55, "r_x1": 388.42, "r_y1": 534.55, "r_x2": 388.42, "r_y2": 531.83, "r_x3": 183.24, "r_y3": 531.83, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 538.44, "r_x1": 388.42, "r_y1": 538.44, "r_x2": 388.42, "r_y2": 535.73, "r_x3": 183.24, "r_y3": 535.73, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 542.34, "r_x1": 388.42, "r_y1": 542.34, "r_x2": 388.42, "r_y2": 539.63, "r_x3": 183.24, "r_y3": 539.63, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 546.24, "r_x1": 388.42, "r_y1": 546.24, "r_x2": 388.42, "r_y2": 543.53, "r_x3": 183.24, "r_y3": 543.53, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 550.14, "r_x1": 388.42, "r_y1": 550.14, "r_x2": 388.42, "r_y2": 547.42, "r_x3": 183.24, "r_y3": 547.42, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 554.04, "r_x1": 388.42, "r_y1": 554.04, "r_x2": 388.42, "r_y2": 551.32, "r_x3": 183.24, "r_y3": 551.32, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 557.94, "r_x1": 191.87, "r_y1": 557.94, "r_x2": 191.87, "r_y2": 555.22, "r_x3": 180.12, "r_y3": 555.22, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 521.02, "r_x1": 408.82, "r_y1": 521.02, "r_x2": 408.82, "r_y2": 518.3, "r_x3": 407.38, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 521.02, "r_x1": 450.49, "r_y1": 521.02, "r_x2": 450.49, "r_y2": 518.3, "r_x3": 410.26, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 524.92, "r_x1": 408.82, "r_y1": 524.92, "r_x2": 408.82, "r_y2": 522.2, "r_x3": 407.38, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 524.92, "r_x1": 450.49, "r_y1": 524.92, "r_x2": 450.49, "r_y2": 522.2, "r_x3": 410.26, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 528.81, "r_x1": 408.82, "r_y1": 528.81, "r_x2": 408.82, "r_y2": 526.1, "r_x3": 407.38, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 528.81, "r_x1": 450.49, "r_y1": 528.81, "r_x2": 450.49, "r_y2": 526.1, "r_x3": 410.26, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 532.71, "r_x1": 408.82, "r_y1": 532.71, "r_x2": 408.82, "r_y2": 530.0, "r_x3": 407.38, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 532.71, "r_x1": 450.49, "r_y1": 532.71, "r_x2": 450.49, "r_y2": 530.0, "r_x3": 410.26, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 536.61, "r_x1": 408.82, "r_y1": 536.61, "r_x2": 408.82, "r_y2": 533.9, "r_x3": 407.38, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 536.61, "r_x1": 450.49, "r_y1": 536.61, "r_x2": 450.49, "r_y2": 533.9, "r_x3": 410.26, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 540.51, "r_x1": 408.82, "r_y1": 540.51, "r_x2": 408.82, "r_y2": 537.79, "r_x3": 407.38, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 540.51, "r_x1": 450.49, "r_y1": 540.51, "r_x2": 450.49, "r_y2": 537.79, "r_x3": 410.26, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 544.41, "r_x1": 408.82, "r_y1": 544.41, "r_x2": 408.82, "r_y2": 541.69, "r_x3": 407.38, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 544.41, "r_x1": 450.49, "r_y1": 544.41, "r_x2": 450.49, "r_y2": 541.69, "r_x3": 410.26, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 548.31, "r_x1": 408.82, "r_y1": 548.31, "r_x2": 408.82, "r_y2": 545.59, "r_x3": 407.38, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 548.31, "r_x1": 450.49, "r_y1": 548.31, "r_x2": 450.49, "r_y2": 545.59, "r_x3": 410.26, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 552.21, "r_x1": 408.82, "r_y1": 552.21, "r_x2": 408.82, "r_y2": 549.49, "r_x3": 407.38, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 552.21, "r_x1": 450.49, "r_y1": 552.21, "r_x2": 450.49, "r_y2": 549.49, "r_x3": 410.26, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.53, "r_y0": 515.31, "r_x1": 181.85, "r_y1": 515.31, "r_x2": 181.85, "r_y2": 509.46, "r_x3": 164.53, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58, "r_y0": 515.31, "r_x1": 186.4, "r_y1": 515.31, "r_x2": 186.4, "r_y2": 509.46, "r_x3": 183.58, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.21, "r_y0": 515.31, "r_x1": 208.9, "r_y1": 515.31, "r_x2": 208.9, "r_y2": 509.46, "r_x3": 189.21, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63, "r_y0": 515.31, "r_x1": 221.04, "r_y1": 515.31, "r_x2": 221.04, "r_y2": 509.46, "r_x3": 210.63, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.46, "r_x1": 406.84, "r_y1": 515.46, "r_x2": 406.84, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.57, "r_y0": 515.46, "r_x1": 411.38, "r_y1": 515.46, "r_x2": 411.38, "r_y2": 509.6, "r_x3": 408.57, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.46, "r_x1": 433.89, "r_y1": 515.46, "r_x2": 433.89, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.62, "r_y0": 515.46, "r_x1": 446.03, "r_y1": 515.46, "r_x2": 446.03, "r_y2": 509.6, "r_x3": 435.62, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19, "r_y0": 526.39, "r_x1": 172.82, "r_y1": 526.39, "r_x2": 172.82, "r_y2": 519.07, "r_x3": 167.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.34, "r_y0": 455.94, "r_x1": 192.97, "r_y1": 455.94, "r_x2": 192.97, "r_y2": 448.62, "r_x3": 187.34, "r_y3": 448.62, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.39, "r_y0": 573.32, "r_x1": 173.02, "r_y1": 573.32, "r_x2": 173.02, "r_y2": 566.01, "r_x3": 167.39, "r_y3": 566.01, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.46, "r_y0": 629.09, "r_x1": 253.66, "r_y1": 629.09, "r_x2": 253.66, "r_y2": 621.78, "r_x3": 248.46, "r_y3": 621.78, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.51, "r_x1": 401.53, "r_y1": 526.51, "r_x2": 401.53, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.63, "r_y0": 597.27, "r_x1": 177.48, "r_y1": 597.27, "r_x2": 177.48, "r_y2": 580.29, "r_x3": 171.63, "r_y3": 580.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.06, "r_y0": 649.92, "r_x1": 256.91, "r_y1": 649.92, "r_x2": 256.91, "r_y2": 633.63, "r_x3": 251.06, "r_y3": 633.63, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 607.31, "r_x1": 427.04, "r_y1": 607.31, "r_x2": 427.04, "r_y2": 601.46, "r_x3": 372.15, "r_y3": 601.46, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 613.75, "r_x1": 430.07, "r_y1": 613.75, "r_x2": 430.07, "r_y2": 607.9, "r_x3": 372.15, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 648.72, "r_x1": 231.08, "r_y1": 648.72, "r_x2": 231.08, "r_y2": 642.87, "r_x3": 176.88, "r_y3": 642.87, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 655.17, "r_x1": 230.99, "r_y1": 655.17, "r_x2": 230.99, "r_y2": 649.31, "r_x3": 176.88, "r_y3": 649.31, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 661.61, "r_x1": 203.93, "r_y1": 661.61, "r_x2": 203.93, "r_y2": 655.76, "r_x3": 176.88, "r_y3": 655.76, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.56, "r_x3": 215.93, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.06, "r_y0": 569.16, "r_x1": 231.72, "r_y1": 569.16, "r_x2": 231.72, "r_y2": 557.56, "r_x3": 229.06, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.21, "r_y0": 451.2, "r_x1": 263.57, "r_y1": 451.2, "r_x2": 263.57, "r_y2": 448.46, "r_x3": 261.21, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33, "r_y0": 451.2, "r_x1": 313.64, "r_y1": 451.2, "r_x2": 313.64, "r_y2": 448.46, "r_x3": 312.33, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41, "r_y0": 451.2, "r_x1": 380.06, "r_y1": 451.2, "r_x2": 380.06, "r_y2": 448.46, "r_x3": 377.41, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 456.08, "r_x1": 205.82, "r_y1": 456.08, "r_x2": 205.82, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.21, "r_y0": 456.08, "r_x1": 229.77, "r_y1": 456.08, "r_x2": 229.77, "r_y2": 453.34, "r_x3": 222.21, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.27, "r_y0": 456.08, "r_x1": 250.83, "r_y1": 456.08, "r_x2": 250.83, "r_y2": 453.34, "r_x3": 243.27, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.08, "r_x1": 271.85, "r_y1": 456.08, "r_x2": 271.85, "r_y2": 453.34, "r_x3": 264.3, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.32, "r_y0": 456.08, "r_x1": 292.88, "r_y1": 456.08, "r_x2": 292.88, "r_y2": 453.34, "r_x3": 285.32, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.38, "r_y0": 456.08, "r_x1": 311.77, "r_y1": 456.08, "r_x2": 311.77, "r_y2": 453.34, "r_x3": 306.38, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.42, "r_y0": 456.08, "r_x1": 325.58, "r_y1": 456.08, "r_x2": 325.58, "r_y2": 453.34, "r_x3": 323.42, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.46, "r_y0": 456.08, "r_x1": 336.62, "r_y1": 456.08, "r_x2": 336.62, "r_y2": 453.34, "r_x3": 334.46, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.53, "r_y0": 456.08, "r_x1": 347.69, "r_y1": 456.08, "r_x2": 347.69, "r_y2": 453.34, "r_x3": 345.53, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.57, "r_y0": 456.08, "r_x1": 358.73, "r_y1": 456.08, "r_x2": 358.73, "r_y2": 453.34, "r_x3": 356.57, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.64, "r_y0": 456.08, "r_x1": 371.97, "r_y1": 456.08, "r_x2": 371.97, "r_y2": 453.34, "r_x3": 367.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.67, "r_y0": 456.08, "r_x1": 387.01, "r_y1": 456.08, "r_x2": 387.01, "r_y2": 453.34, "r_x3": 382.67, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.74, "r_y0": 456.08, "r_x1": 402.07, "r_y1": 456.08, "r_x2": 402.07, "r_y2": 453.34, "r_x3": 397.74, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 457.8, "r_x1": 414.93, "r_y1": 457.8, "r_x2": 414.93, "r_y2": 447.99, "r_x3": 412.79, "r_y3": 447.99, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.96, "r_y0": 456.08, "r_x1": 422.52, "r_y1": 456.08, "r_x2": 422.52, "r_y2": 453.34, "r_x3": 414.96, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.58, "r_y1": 466.66, "r_x2": 204.58, "r_y2": 463.92, "r_x3": 200.64, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.92, "r_x3": 367.63, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 466.66, "r_x1": 384.62, "r_y1": 466.66, "r_x2": 384.62, "r_y2": 463.92, "r_x3": 382.66, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 466.66, "r_x1": 399.68, "r_y1": 466.66, "r_x2": 399.68, "r_y2": 463.92, "r_x3": 397.73, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.54, "r_x1": 206.52, "r_y1": 471.54, "r_x2": 206.52, "r_y2": 468.8, "r_x3": 200.64, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 471.54, "r_x1": 266.26, "r_y1": 471.54, "r_x2": 266.26, "r_y2": 468.8, "r_x3": 264.29, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37, "r_y0": 471.54, "r_x1": 308.34, "r_y1": 471.54, "r_x2": 308.34, "r_y2": 468.8, "r_x3": 306.37, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52, "r_y0": 471.54, "r_x1": 347.48, "r_y1": 471.54, "r_x2": 347.48, "r_y2": 468.8, "r_x3": 345.52, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56, "r_y0": 471.54, "r_x1": 358.52, "r_y1": 471.54, "r_x2": 358.52, "r_y2": 468.8, "r_x3": 356.56, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 471.54, "r_x1": 369.59, "r_y1": 471.54, "r_x2": 369.59, "r_y2": 468.8, "r_x3": 367.63, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 471.54, "r_x1": 384.63, "r_y1": 471.54, "r_x2": 384.63, "r_y2": 468.8, "r_x3": 382.66, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.42, "r_x1": 206.52, "r_y1": 476.42, "r_x2": 206.52, "r_y2": 473.68, "r_x3": 200.64, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 476.42, "r_x1": 266.26, "r_y1": 476.42, "r_x2": 266.26, "r_y2": 473.68, "r_x3": 264.29, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.27, "r_x1": 206.52, "r_y1": 481.27, "r_x2": 206.52, "r_y2": 478.53, "r_x3": 200.64, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26, "r_y0": 481.27, "r_x1": 245.23, "r_y1": 481.27, "r_x2": 245.23, "r_y2": 478.53, "r_x3": 243.26, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 481.27, "r_x1": 266.26, "r_y1": 481.27, "r_x2": 266.26, "r_y2": 478.53, "r_x3": 264.29, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.27, "r_x1": 325.37, "r_y1": 481.27, "r_x2": 325.37, "r_y2": 478.53, "r_x3": 323.4, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 481.27, "r_x1": 399.69, "r_y1": 481.27, "r_x2": 399.69, "r_y2": 478.53, "r_x3": 397.73, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.15, "r_x1": 206.52, "r_y1": 486.15, "r_x2": 206.52, "r_y2": 483.41, "r_x3": 200.64, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 486.15, "r_x1": 384.62, "r_y1": 486.15, "r_x2": 384.62, "r_y2": 483.41, "r_x3": 382.66, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 486.15, "r_x1": 401.65, "r_y1": 486.15, "r_x2": 401.65, "r_y2": 483.41, "r_x3": 397.73, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 486.15, "r_x1": 414.74, "r_y1": 486.15, "r_x2": 414.74, "r_y2": 483.41, "r_x3": 412.79, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 491.03, "r_x1": 207.14, "r_y1": 491.03, "r_x2": 207.14, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 491.03, "r_x1": 369.78, "r_y1": 491.03, "r_x2": 369.78, "r_y2": 488.29, "r_x3": 367.63, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 491.03, "r_x1": 384.82, "r_y1": 491.03, "r_x2": 384.82, "r_y2": 488.29, "r_x3": 382.66, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 491.03, "r_x1": 402.05, "r_y1": 491.03, "r_x2": 402.05, "r_y2": 488.29, "r_x3": 397.73, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 495.9, "r_x1": 208.49, "r_y1": 495.9, "r_x2": 208.49, "r_y2": 493.17, "r_x3": 200.64, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 495.9, "r_x1": 266.26, "r_y1": 495.9, "r_x2": 266.26, "r_y2": 493.17, "r_x3": 264.29, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 58, "label": "text", "bbox": { "l": 180.12, "t": 516.23, "r": 190.62, "b": 518.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 518.95, "r_x1": 190.62, "r_y1": 518.95, "r_x2": 190.62, "r_y2": 516.23, "r_x3": 180.12, "r_y3": 516.23, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 183.24, "t": 520.13, "r": 304.55, "b": 522.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 522.85, "r_x1": 304.55, "r_y1": 522.85, "r_x2": 304.55, "r_y2": 520.13, "r_x3": 183.24, "r_y3": 520.13, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.24, "t": 524.03, "r": 388.42, "b": 526.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 526.75, "r_x1": 388.42, "r_y1": 526.75, "r_x2": 388.42, "r_y2": 524.03, "r_x3": 183.24, "r_y3": 524.03, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 183.24, "t": 527.93, "r": 388.42, "b": 530.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 530.65, "r_x1": 388.42, "r_y1": 530.65, "r_x2": 388.42, "r_y2": 527.93, "r_x3": 183.24, "r_y3": 527.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 183.24, "t": 531.83, "r": 388.42, "b": 534.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 534.55, "r_x1": 388.42, "r_y1": 534.55, "r_x2": 388.42, "r_y2": 531.83, "r_x3": 183.24, "r_y3": 531.83, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 183.24, "t": 535.73, "r": 388.42, "b": 538.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 538.44, "r_x1": 388.42, "r_y1": 538.44, "r_x2": 388.42, "r_y2": 535.73, "r_x3": 183.24, "r_y3": 535.73, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 183.24, "t": 539.63, "r": 388.42, "b": 542.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 542.34, "r_x1": 388.42, "r_y1": 542.34, "r_x2": 388.42, "r_y2": 539.63, "r_x3": 183.24, "r_y3": 539.63, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 183.24, "t": 543.53, "r": 388.42, "b": 546.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 546.24, "r_x1": 388.42, "r_y1": 546.24, "r_x2": 388.42, "r_y2": 543.53, "r_x3": 183.24, "r_y3": 543.53, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 183.24, "t": 547.42, "r": 388.42, "b": 550.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 550.14, "r_x1": 388.42, "r_y1": 550.14, "r_x2": 388.42, "r_y2": 547.42, "r_x3": 183.24, "r_y3": 547.42, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.24, "t": 551.32, "r": 388.42, "b": 554.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 554.04, "r_x1": 388.42, "r_y1": 554.04, "r_x2": 388.42, "r_y2": 551.32, "r_x3": 183.24, "r_y3": 551.32, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 180.12, "t": 555.22, "r": 191.87, "b": 557.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 557.94, "r_x1": 191.87, "r_y1": 557.94, "r_x2": 191.87, "r_y2": 555.22, "r_x3": 180.12, "r_y3": 555.22, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 407.38, "t": 518.3, "r": 408.82, "b": 521.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 521.02, "r_x1": 408.82, "r_y1": 521.02, "r_x2": 408.82, "r_y2": 518.3, "r_x3": 407.38, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 410.26, "t": 518.3, "r": 450.49, "b": 521.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 521.02, "r_x1": 450.49, "r_y1": 521.02, "r_x2": 450.49, "r_y2": 518.3, "r_x3": 410.26, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 407.38, "t": 522.2, "r": 408.82, "b": 524.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 524.92, "r_x1": 408.82, "r_y1": 524.92, "r_x2": 408.82, "r_y2": 522.2, "r_x3": 407.38, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 410.26, "t": 522.2, "r": 450.49, "b": 524.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 524.92, "r_x1": 450.49, "r_y1": 524.92, "r_x2": 450.49, "r_y2": 522.2, "r_x3": 410.26, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 407.38, "t": 526.1, "r": 408.82, "b": 528.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 528.81, "r_x1": 408.82, "r_y1": 528.81, "r_x2": 408.82, "r_y2": 526.1, "r_x3": 407.38, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 410.26, "t": 526.1, "r": 450.49, "b": 528.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 528.81, "r_x1": 450.49, "r_y1": 528.81, "r_x2": 450.49, "r_y2": 526.1, "r_x3": 410.26, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 407.38, "t": 530.0, "r": 408.82, "b": 532.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 532.71, "r_x1": 408.82, "r_y1": 532.71, "r_x2": 408.82, "r_y2": 530.0, "r_x3": 407.38, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 410.26, "t": 530.0, "r": 450.49, "b": 532.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 532.71, "r_x1": 450.49, "r_y1": 532.71, "r_x2": 450.49, "r_y2": 530.0, "r_x3": 410.26, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 407.38, "t": 533.9, "r": 408.82, "b": 536.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 536.61, "r_x1": 408.82, "r_y1": 536.61, "r_x2": 408.82, "r_y2": 533.9, "r_x3": 407.38, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 410.26, "t": 533.9, "r": 450.49, "b": 536.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 536.61, "r_x1": 450.49, "r_y1": 536.61, "r_x2": 450.49, "r_y2": 533.9, "r_x3": 410.26, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 407.38, "t": 537.79, "r": 408.82, "b": 540.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 540.51, "r_x1": 408.82, "r_y1": 540.51, "r_x2": 408.82, "r_y2": 537.79, "r_x3": 407.38, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 410.26, "t": 537.79, "r": 450.49, "b": 540.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 540.51, "r_x1": 450.49, "r_y1": 540.51, "r_x2": 450.49, "r_y2": 537.79, "r_x3": 410.26, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 407.38, "t": 541.69, "r": 408.82, "b": 544.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 544.41, "r_x1": 408.82, "r_y1": 544.41, "r_x2": 408.82, "r_y2": 541.69, "r_x3": 407.38, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 410.26, "t": 541.69, "r": 450.49, "b": 544.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 544.41, "r_x1": 450.49, "r_y1": 544.41, "r_x2": 450.49, "r_y2": 541.69, "r_x3": 410.26, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 407.38, "t": 545.59, "r": 408.82, "b": 548.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 548.31, "r_x1": 408.82, "r_y1": 548.31, "r_x2": 408.82, "r_y2": 545.59, "r_x3": 407.38, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 410.26, "t": 545.59, "r": 450.49, "b": 548.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 548.31, "r_x1": 450.49, "r_y1": 548.31, "r_x2": 450.49, "r_y2": 545.59, "r_x3": 410.26, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 407.38, "t": 549.49, "r": 408.82, "b": 552.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 552.21, "r_x1": 408.82, "r_y1": 552.21, "r_x2": 408.82, "r_y2": 549.49, "r_x3": 407.38, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 410.26, "t": 549.49, "r": 450.49, "b": 552.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 552.21, "r_x1": 450.49, "r_y1": 552.21, "r_x2": 450.49, "r_y2": 549.49, "r_x3": 410.26, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 164.53, "t": 509.46, "r": 181.85, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.53, "r_y0": 515.31, "r_x1": 181.85, "r_y1": 515.31, "r_x2": 181.85, "r_y2": 509.46, "r_x3": 164.53, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.58, "t": 509.46, "r": 186.4, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58, "r_y0": 515.31, "r_x1": 186.4, "r_y1": 515.31, "r_x2": 186.4, "r_y2": 509.46, "r_x3": 183.58, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 189.21, "t": 509.46, "r": 208.9, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.21, "r_y0": 515.31, "r_x1": 208.9, "r_y1": 515.31, "r_x2": 208.9, "r_y2": 509.46, "r_x3": 189.21, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 210.63, "t": 509.46, "r": 221.04, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63, "r_y0": 515.31, "r_x1": 221.04, "r_y1": 515.31, "r_x2": 221.04, "r_y2": 509.46, "r_x3": 210.63, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 390.2, "t": 509.6, "r": 406.84, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.46, "r_x1": 406.84, "r_y1": 515.46, "r_x2": 406.84, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 408.57, "t": 509.6, "r": 411.38, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.57, "r_y0": 515.46, "r_x1": 411.38, "r_y1": 515.46, "r_x2": 411.38, "r_y2": 509.6, "r_x3": 408.57, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 414.2, "t": 509.6, "r": 433.89, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.46, "r_x1": 433.89, "r_y1": 515.46, "r_x2": 433.89, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 435.62, "t": 509.6, "r": 446.03, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.62, "r_y0": 515.46, "r_x1": 446.03, "r_y1": 515.46, "r_x2": 446.03, "r_y2": 509.6, "r_x3": 435.62, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 167.19, "t": 519.07, "r": 172.82, "b": 526.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19, "r_y0": 526.39, "r_x1": 172.82, "r_y1": 526.39, "r_x2": 172.82, "r_y2": 519.07, "r_x3": 167.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 187.34, "t": 448.62, "r": 192.97, "b": 455.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.34, "r_y0": 455.94, "r_x1": 192.97, "r_y1": 455.94, "r_x2": 192.97, "r_y2": 448.62, "r_x3": 187.34, "r_y3": 448.62, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 167.39, "t": 566.01, "r": 173.02, "b": 573.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.39, "r_y0": 573.32, "r_x1": 173.02, "r_y1": 573.32, "r_x2": 173.02, "r_y2": 566.01, "r_x3": 167.39, "r_y3": 566.01, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 248.46, "t": 621.78, "r": 253.66, "b": 629.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.46, "r_y0": 629.09, "r_x1": 253.66, "r_y1": 629.09, "r_x2": 253.66, "r_y2": 621.78, "r_x3": 248.46, "r_y3": 621.78, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 395.9, "t": 519.2, "r": 401.53, "b": 526.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.51, "r_x1": 401.53, "r_y1": 526.51, "r_x2": 401.53, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 171.63, "t": 580.29, "r": 177.48, "b": 597.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.63, "r_y0": 597.27, "r_x1": 177.48, "r_y1": 597.27, "r_x2": 177.48, "r_y2": 580.29, "r_x3": 171.63, "r_y3": 580.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 251.06, "t": 633.63, "r": 256.91, "b": 649.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.06, "r_y0": 649.92, "r_x1": 256.91, "r_y1": 649.92, "r_x2": 256.91, "r_y2": 633.63, "r_x3": 251.06, "r_y3": 633.63, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 372.15, "t": 601.46, "r": 427.04, "b": 607.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 607.31, "r_x1": 427.04, "r_y1": 607.31, "r_x2": 427.04, "r_y2": 601.46, "r_x3": 372.15, "r_y3": 601.46, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 372.15, "t": 607.9, "r": 430.07, "b": 613.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 613.75, "r_x1": 430.07, "r_y1": 613.75, "r_x2": 430.07, "r_y2": 607.9, "r_x3": 372.15, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 176.88, "t": 642.87, "r": 231.08, "b": 648.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 648.72, "r_x1": 231.08, "r_y1": 648.72, "r_x2": 231.08, "r_y2": 642.87, "r_x3": 176.88, "r_y3": 642.87, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 176.88, "t": 649.31, "r": 230.99, "b": 655.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 655.17, "r_x1": 230.99, "r_y1": 655.17, "r_x2": 230.99, "r_y2": 649.31, "r_x3": 176.88, "r_y3": 649.31, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 176.88, "t": 655.76, "r": 203.93, "b": 661.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 661.61, "r_x1": 203.93, "r_y1": 661.61, "r_x2": 203.93, "r_y2": 655.76, "r_x3": 176.88, "r_y3": 655.76, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 215.93, "t": 557.56, "r": 218.47, "b": 569.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.56, "r_x3": 215.93, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 229.06, "t": 557.56, "r": 231.72, "b": 569.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.06, "r_y0": 569.16, "r_x1": 231.72, "r_y1": 569.16, "r_x2": 231.72, "r_y2": 557.56, "r_x3": 229.06, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 261.21, "t": 448.46, "r": 263.57, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.21, "r_y0": 451.2, "r_x1": 263.57, "r_y1": 451.2, "r_x2": 263.57, "r_y2": 448.46, "r_x3": 261.21, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 312.33, "t": 448.46, "r": 313.64, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33, "r_y0": 451.2, "r_x1": 313.64, "r_y1": 451.2, "r_x2": 313.64, "r_y2": 448.46, "r_x3": 312.33, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 377.41, "t": 448.46, "r": 380.06, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41, "r_y0": 451.2, "r_x1": 380.06, "r_y1": 451.2, "r_x2": 380.06, "r_y2": 448.46, "r_x3": 377.41, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 200.64, "t": 453.34, "r": 205.82, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 456.08, "r_x1": 205.82, "r_y1": 456.08, "r_x2": 205.82, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 222.21, "t": 453.34, "r": 229.77, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.21, "r_y0": 456.08, "r_x1": 229.77, "r_y1": 456.08, "r_x2": 229.77, "r_y2": 453.34, "r_x3": 222.21, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 243.27, "t": 453.34, "r": 250.83, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.27, "r_y0": 456.08, "r_x1": 250.83, "r_y1": 456.08, "r_x2": 250.83, "r_y2": 453.34, "r_x3": 243.27, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 264.3, "t": 453.34, "r": 271.85, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.08, "r_x1": 271.85, "r_y1": 456.08, "r_x2": 271.85, "r_y2": 453.34, "r_x3": 264.3, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 285.32, "t": 453.34, "r": 292.88, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.32, "r_y0": 456.08, "r_x1": 292.88, "r_y1": 456.08, "r_x2": 292.88, "r_y2": 453.34, "r_x3": 285.32, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 306.38, "t": 453.34, "r": 311.77, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.38, "r_y0": 456.08, "r_x1": 311.77, "r_y1": 456.08, "r_x2": 311.77, "r_y2": 453.34, "r_x3": 306.38, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 323.42, "t": 453.34, "r": 325.58, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.42, "r_y0": 456.08, "r_x1": 325.58, "r_y1": 456.08, "r_x2": 325.58, "r_y2": 453.34, "r_x3": 323.42, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 334.46, "t": 453.34, "r": 336.62, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.46, "r_y0": 456.08, "r_x1": 336.62, "r_y1": 456.08, "r_x2": 336.62, "r_y2": 453.34, "r_x3": 334.46, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 345.53, "t": 453.34, "r": 347.69, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.53, "r_y0": 456.08, "r_x1": 347.69, "r_y1": 456.08, "r_x2": 347.69, "r_y2": 453.34, "r_x3": 345.53, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 356.57, "t": 453.34, "r": 358.73, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.57, "r_y0": 456.08, "r_x1": 358.73, "r_y1": 456.08, "r_x2": 358.73, "r_y2": 453.34, "r_x3": 356.57, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 367.64, "t": 453.34, "r": 371.97, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.64, "r_y0": 456.08, "r_x1": 371.97, "r_y1": 456.08, "r_x2": 371.97, "r_y2": 453.34, "r_x3": 367.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 382.67, "t": 453.34, "r": 387.01, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.67, "r_y0": 456.08, "r_x1": 387.01, "r_y1": 456.08, "r_x2": 387.01, "r_y2": 453.34, "r_x3": 382.67, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 397.74, "t": 453.34, "r": 402.07, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.74, "r_y0": 456.08, "r_x1": 402.07, "r_y1": 456.08, "r_x2": 402.07, "r_y2": 453.34, "r_x3": 397.74, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 412.79, "t": 447.99, "r": 414.93, "b": 457.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 457.8, "r_x1": 414.93, "r_y1": 457.8, "r_x2": 414.93, "r_y2": 447.99, "r_x3": 412.79, "r_y3": 447.99, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 414.96, "t": 453.34, "r": 422.52, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.96, "r_y0": 456.08, "r_x1": 422.52, "r_y1": 456.08, "r_x2": 422.52, "r_y2": 453.34, "r_x3": 414.96, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 200.64, "t": 463.92, "r": 204.58, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.58, "r_y1": 466.66, "r_x2": 204.58, "r_y2": 463.92, "r_x3": 200.64, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 367.63, "t": 463.92, "r": 369.58, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.92, "r_x3": 367.63, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 382.66, "t": 463.92, "r": 384.62, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 466.66, "r_x1": 384.62, "r_y1": 466.66, "r_x2": 384.62, "r_y2": 463.92, "r_x3": 382.66, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 397.73, "t": 463.92, "r": 399.68, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 466.66, "r_x1": 399.68, "r_y1": 466.66, "r_x2": 399.68, "r_y2": 463.92, "r_x3": 397.73, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 200.64, "t": 468.8, "r": 206.52, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.54, "r_x1": 206.52, "r_y1": 471.54, "r_x2": 206.52, "r_y2": 468.8, "r_x3": 200.64, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 264.29, "t": 468.8, "r": 266.26, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 471.54, "r_x1": 266.26, "r_y1": 471.54, "r_x2": 266.26, "r_y2": 468.8, "r_x3": 264.29, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 306.37, "t": 468.8, "r": 308.34, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37, "r_y0": 471.54, "r_x1": 308.34, "r_y1": 471.54, "r_x2": 308.34, "r_y2": 468.8, "r_x3": 306.37, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 345.52, "t": 468.8, "r": 347.48, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52, "r_y0": 471.54, "r_x1": 347.48, "r_y1": 471.54, "r_x2": 347.48, "r_y2": 468.8, "r_x3": 345.52, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 356.56, "t": 468.8, "r": 358.52, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56, "r_y0": 471.54, "r_x1": 358.52, "r_y1": 471.54, "r_x2": 358.52, "r_y2": 468.8, "r_x3": 356.56, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 367.63, "t": 468.8, "r": 369.59, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 471.54, "r_x1": 369.59, "r_y1": 471.54, "r_x2": 369.59, "r_y2": 468.8, "r_x3": 367.63, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 382.66, "t": 468.8, "r": 384.63, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 471.54, "r_x1": 384.63, "r_y1": 471.54, "r_x2": 384.63, "r_y2": 468.8, "r_x3": 382.66, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 200.64, "t": 473.68, "r": 206.52, "b": 476.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.42, "r_x1": 206.52, "r_y1": 476.42, "r_x2": 206.52, "r_y2": 473.68, "r_x3": 200.64, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 264.29, "t": 473.68, "r": 266.26, "b": 476.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 476.42, "r_x1": 266.26, "r_y1": 476.42, "r_x2": 266.26, "r_y2": 473.68, "r_x3": 264.29, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 200.64, "t": 478.53, "r": 206.52, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.27, "r_x1": 206.52, "r_y1": 481.27, "r_x2": 206.52, "r_y2": 478.53, "r_x3": 200.64, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 243.26, "t": 478.53, "r": 245.23, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26, "r_y0": 481.27, "r_x1": 245.23, "r_y1": 481.27, "r_x2": 245.23, "r_y2": 478.53, "r_x3": 243.26, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 264.29, "t": 478.53, "r": 266.26, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 481.27, "r_x1": 266.26, "r_y1": 481.27, "r_x2": 266.26, "r_y2": 478.53, "r_x3": 264.29, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 323.4, "t": 478.53, "r": 325.37, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.27, "r_x1": 325.37, "r_y1": 481.27, "r_x2": 325.37, "r_y2": 478.53, "r_x3": 323.4, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 397.73, "t": 478.53, "r": 399.69, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 481.27, "r_x1": 399.69, "r_y1": 481.27, "r_x2": 399.69, "r_y2": 478.53, "r_x3": 397.73, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 200.64, "t": 483.41, "r": 206.52, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.15, "r_x1": 206.52, "r_y1": 486.15, "r_x2": 206.52, "r_y2": 483.41, "r_x3": 200.64, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 382.66, "t": 483.41, "r": 384.62, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 486.15, "r_x1": 384.62, "r_y1": 486.15, "r_x2": 384.62, "r_y2": 483.41, "r_x3": 382.66, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 397.73, "t": 483.41, "r": 401.65, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 486.15, "r_x1": 401.65, "r_y1": 486.15, "r_x2": 401.65, "r_y2": 483.41, "r_x3": 397.73, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 412.79, "t": 483.41, "r": 414.74, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 486.15, "r_x1": 414.74, "r_y1": 486.15, "r_x2": 414.74, "r_y2": 483.41, "r_x3": 412.79, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 200.64, "t": 488.29, "r": 207.14, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 491.03, "r_x1": 207.14, "r_y1": 491.03, "r_x2": 207.14, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 367.63, "t": 488.29, "r": 369.78, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 491.03, "r_x1": 369.78, "r_y1": 491.03, "r_x2": 369.78, "r_y2": 488.29, "r_x3": 367.63, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 382.66, "t": 488.29, "r": 384.82, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 491.03, "r_x1": 384.82, "r_y1": 491.03, "r_x2": 384.82, "r_y2": 488.29, "r_x3": 382.66, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 397.73, "t": 488.29, "r": 402.05, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 491.03, "r_x1": 402.05, "r_y1": 491.03, "r_x2": 402.05, "r_y2": 488.29, "r_x3": 397.73, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 200.64, "t": 493.17, "r": 208.49, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 495.9, "r_x1": 208.49, "r_y1": 495.9, "r_x2": 208.49, "r_y2": 493.17, "r_x3": 200.64, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 264.29, "t": 493.17, "r": 266.26, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 495.9, "r_x1": 266.26, "r_y1": 495.9, "r_x2": 266.26, "r_y2": 493.17, "r_x3": 264.29, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, { "id": 155, "label": "text", "bbox": { "l": 227.91, "t": 665.83, "r": 230.1, "b": 675.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.91, "r_y0": 675.35, "r_x1": 230.1, "r_y1": 675.35, "r_x2": 230.1, "r_y2": 665.83, "r_x3": 227.91, "r_y3": 665.83, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 156, "label": "text", "bbox": { "l": 300.58, "t": 683.62, "r": 302.73, "b": 693.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.58, "r_y0": 693.43, "r_x1": 302.73, "r_y1": 693.43, "r_x2": 302.73, "r_y2": 683.62, "r_x3": 300.58, "r_y3": 683.62, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": { "0": { "label": "table", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "table", "bbox": { "l": 143.64, "t": 156.35, "r": 470.85, "b": 263.26, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.78, "r_y0": 174.63, "r_x1": 195.0, "r_y1": 174.63, "r_x2": 195.0, "r_y2": 166.56, "r_x3": 160.78, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52, "r_y0": 174.6, "r_x1": 254.04, "r_y1": 174.6, "r_x2": 254.04, "r_y2": 166.53, "r_x3": 215.52, "r_y3": 166.53, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.15, "r_x1": 323.99, "r_y1": 169.15, "r_x2": 323.99, "r_y2": 161.08, "r_x3": 300.4, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.35, "r_y0": 174.63, "r_x1": 414.75, "r_y1": 174.63, "r_x2": 414.75, "r_y2": 166.56, "r_x3": 370.35, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.74, "r_y0": 169.15, "r_x1": 463.11, "r_y1": 169.15, "r_x2": 463.11, "r_y2": 161.08, "r_x3": 426.74, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11, "r_y0": 180.11, "r_x1": 466.73, "r_y1": 180.11, "r_x2": 466.73, "r_y2": 172.04, "r_x3": 423.11, "r_y3": 172.04, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41, "r_y0": 182.1, "r_x1": 288.06, "r_y1": 182.1, "r_x2": 288.06, "r_y2": 174.03, "r_x3": 262.41, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.43, "r_y0": 182.1, "r_x1": 329.45, "r_y1": 182.1, "r_x2": 329.45, "r_y2": 174.03, "r_x3": 296.43, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03, "r_y0": 182.1, "r_x1": 354.76, "r_y1": 182.1, "r_x2": 354.76, "r_y2": 174.03, "r_x3": 345.03, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.54, "r_y0": 200.93, "r_x1": 201.24, "r_y1": 200.93, "r_x2": 201.24, "r_y2": 192.86, "r_x3": 154.54, "r_y3": 192.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 195.45, "r_x1": 247.13, "r_y1": 195.45, "r_x2": 247.13, "r_y2": 187.38, "r_x3": 222.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 195.45, "r_x1": 285.73, "r_y1": 195.45, "r_x2": 285.73, "r_y2": 187.38, "r_x3": 264.74, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 195.45, "r_x1": 323.43, "r_y1": 195.45, "r_x2": 323.43, "r_y2": 187.38, "r_x3": 302.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.45, "r_x1": 360.39, "r_y1": 195.45, "r_x2": 360.39, "r_y2": 187.38, "r_x3": 339.4, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.12, "r_y0": 195.24, "r_x1": 401.97, "r_y1": 195.24, "r_x2": 401.97, "r_y2": 187.32, "r_x3": 383.12, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 195.24, "r_x1": 454.35, "r_y1": 195.24, "r_x2": 454.35, "r_y2": 187.32, "r_x3": 435.49, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.67, "r_y1": 208.4, "r_x2": 248.67, "r_y2": 200.33, "r_x3": 220.9, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 208.4, "r_x1": 285.73, "r_y1": 208.4, "r_x2": 285.73, "r_y2": 200.33, "r_x3": 264.74, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 208.4, "r_x1": 323.43, "r_y1": 208.4, "r_x2": 323.43, "r_y2": 200.33, "r_x3": 302.44, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.39, "r_y1": 208.4, "r_x2": 360.39, "r_y2": 200.33, "r_x3": 339.4, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 208.4, "r_x1": 403.04, "r_y1": 208.4, "r_x2": 403.04, "r_y2": 200.33, "r_x3": 382.05, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 208.4, "r_x1": 453.11, "r_y1": 208.4, "r_x2": 453.11, "r_y2": 200.33, "r_x3": 436.73, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.95, "r_y0": 227.23, "r_x1": 199.83, "r_y1": 227.23, "r_x2": 199.83, "r_y2": 219.16, "r_x3": 155.95, "r_y3": 219.16, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 221.75, "r_x1": 247.13, "r_y1": 221.75, "r_x2": 247.13, "r_y2": 213.68, "r_x3": 222.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 221.75, "r_x1": 285.73, "r_y1": 221.75, "r_x2": 285.73, "r_y2": 213.68, "r_x3": 264.74, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 221.75, "r_x1": 323.43, "r_y1": 221.75, "r_x2": 323.43, "r_y2": 213.68, "r_x3": 302.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 221.55, "r_x1": 361.98, "r_y1": 221.55, "r_x2": 361.98, "r_y2": 213.62, "r_x3": 337.81, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 221.55, "r_x1": 404.62, "r_y1": 221.55, "r_x2": 404.62, "r_y2": 213.62, "r_x3": 380.46, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 221.55, "r_x1": 454.35, "r_y1": 221.55, "r_x2": 454.35, "r_y2": 213.62, "r_x3": 435.49, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.67, "r_y1": 234.7, "r_x2": 248.67, "r_y2": 226.63, "r_x3": 220.9, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 234.7, "r_x1": 285.73, "r_y1": 234.7, "r_x2": 285.73, "r_y2": 226.63, "r_x3": 264.74, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 234.7, "r_x1": 323.43, "r_y1": 234.7, "r_x2": 323.43, "r_y2": 226.63, "r_x3": 302.44, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.71, "r_y0": 234.7, "r_x1": 358.09, "r_y1": 234.7, "r_x2": 358.09, "r_y2": 226.63, "r_x3": 341.71, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 234.7, "r_x1": 403.04, "r_y1": 234.7, "r_x2": 403.04, "r_y2": 226.63, "r_x3": 382.05, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 234.7, "r_x1": 453.11, "r_y1": 234.7, "r_x2": 453.11, "r_y2": 226.63, "r_x3": 436.73, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.63, "r_y0": 253.53, "r_x1": 207.15, "r_y1": 253.53, "r_x2": 207.15, "r_y2": 245.46, "r_x3": 148.63, "r_y3": 245.46, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 248.05, "r_x1": 247.13, "r_y1": 248.05, "r_x2": 247.13, "r_y2": 239.98, "r_x3": 222.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 248.05, "r_x1": 285.73, "r_y1": 248.05, "r_x2": 285.73, "r_y2": 239.98, "r_x3": 264.74, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 248.05, "r_x1": 323.43, "r_y1": 248.05, "r_x2": 323.43, "r_y2": 239.98, "r_x3": 302.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 247.85, "r_x1": 361.98, "r_y1": 247.85, "r_x2": 361.98, "r_y2": 239.92, "r_x3": 337.81, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 247.85, "r_x1": 404.62, "r_y1": 247.85, "r_x2": 404.62, "r_y2": 239.92, "r_x3": 380.46, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 247.85, "r_x1": 454.35, "r_y1": 247.85, "r_x2": 454.35, "r_y2": 239.92, "r_x3": 435.49, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.67, "r_y1": 261.0, "r_x2": 248.67, "r_y2": 252.93, "r_x3": 220.9, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 261.0, "r_x1": 285.73, "r_y1": 261.0, "r_x2": 285.73, "r_y2": 252.93, "r_x3": 264.74, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 261.0, "r_x1": 323.43, "r_y1": 261.0, "r_x2": 323.43, "r_y2": 252.93, "r_x3": 302.44, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.39, "r_y1": 261.0, "r_x2": 360.39, "r_y2": 252.93, "r_x3": 339.4, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 261.0, "r_x1": 403.04, "r_y1": 261.0, "r_x2": 403.04, "r_y2": 252.93, "r_x3": 382.05, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 261.0, "r_x1": 453.11, "r_y1": 261.0, "r_x2": 453.11, "r_y2": 252.93, "r_x3": 436.73, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.78, "t": 166.56, "r": 195.0, "b": 174.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.78, "r_y0": 174.63, "r_x1": 195.0, "r_y1": 174.63, "r_x2": 195.0, "r_y2": 166.56, "r_x3": 160.78, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.52, "t": 166.53, "r": 254.04, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52, "r_y0": 174.6, "r_x1": 254.04, "r_y1": 174.6, "r_x2": 254.04, "r_y2": 166.53, "r_x3": 215.52, "r_y3": 166.53, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.4, "t": 161.08, "r": 323.99, "b": 169.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.15, "r_x1": 323.99, "r_y1": 169.15, "r_x2": 323.99, "r_y2": 161.08, "r_x3": 300.4, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.35, "t": 166.56, "r": 414.75, "b": 174.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.35, "r_y0": 174.63, "r_x1": 414.75, "r_y1": 174.63, "r_x2": 414.75, "r_y2": 166.56, "r_x3": 370.35, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.74, "t": 161.08, "r": 463.11, "b": 169.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.74, "r_y0": 169.15, "r_x1": 463.11, "r_y1": 169.15, "r_x2": 463.11, "r_y2": 161.08, "r_x3": 426.74, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.11, "t": 172.04, "r": 466.73, "b": 180.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11, "r_y0": 180.11, "r_x1": 466.73, "r_y1": 180.11, "r_x2": 466.73, "r_y2": 172.04, "r_x3": 423.11, "r_y3": 172.04, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.41, "t": 174.03, "r": 288.06, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41, "r_y0": 182.1, "r_x1": 288.06, "r_y1": 182.1, "r_x2": 288.06, "r_y2": 174.03, "r_x3": 262.41, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.43, "t": 174.03, "r": 329.45, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.43, "r_y0": 182.1, "r_x1": 329.45, "r_y1": 182.1, "r_x2": 329.45, "r_y2": 174.03, "r_x3": 296.43, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.03, "t": 174.03, "r": 354.76, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03, "r_y0": 182.1, "r_x1": 354.76, "r_y1": 182.1, "r_x2": 354.76, "r_y2": 174.03, "r_x3": 345.03, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.54, "t": 192.86, "r": 201.24, "b": 200.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.54, "r_y0": 200.93, "r_x1": 201.24, "r_y1": 200.93, "r_x2": 201.24, "r_y2": 192.86, "r_x3": 154.54, "r_y3": 192.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.44, "t": 187.38, "r": 247.13, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 195.45, "r_x1": 247.13, "r_y1": 195.45, "r_x2": 247.13, "r_y2": 187.38, "r_x3": 222.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.74, "t": 187.38, "r": 285.73, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 195.45, "r_x1": 285.73, "r_y1": 195.45, "r_x2": 285.73, "r_y2": 187.38, "r_x3": 264.74, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.44, "t": 187.38, "r": 323.43, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 195.45, "r_x1": 323.43, "r_y1": 195.45, "r_x2": 323.43, "r_y2": 187.38, "r_x3": 302.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.4, "t": 187.38, "r": 360.39, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.45, "r_x1": 360.39, "r_y1": 195.45, "r_x2": 360.39, "r_y2": 187.38, "r_x3": 339.4, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.12, "t": 187.32, "r": 401.97, "b": 195.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.12, "r_y0": 195.24, "r_x1": 401.97, "r_y1": 195.24, "r_x2": 401.97, "r_y2": 187.32, "r_x3": 383.12, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.49, "t": 187.32, "r": 454.35, "b": 195.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 195.24, "r_x1": 454.35, "r_y1": 195.24, "r_x2": 454.35, "r_y2": 187.32, "r_x3": 435.49, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.9, "t": 200.33, "r": 248.67, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.67, "r_y1": 208.4, "r_x2": 248.67, "r_y2": 200.33, "r_x3": 220.9, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.74, "t": 200.33, "r": 285.73, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 208.4, "r_x1": 285.73, "r_y1": 208.4, "r_x2": 285.73, "r_y2": 200.33, "r_x3": 264.74, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.44, "t": 200.33, "r": 323.43, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 208.4, "r_x1": 323.43, "r_y1": 208.4, "r_x2": 323.43, "r_y2": 200.33, "r_x3": 302.44, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.4, "t": 200.33, "r": 360.39, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.39, "r_y1": 208.4, "r_x2": 360.39, "r_y2": 200.33, "r_x3": 339.4, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.05, "t": 200.33, "r": 403.04, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 208.4, "r_x1": 403.04, "r_y1": 208.4, "r_x2": 403.04, "r_y2": 200.33, "r_x3": 382.05, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.73, "t": 200.33, "r": 453.11, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 208.4, "r_x1": 453.11, "r_y1": 208.4, "r_x2": 453.11, "r_y2": 200.33, "r_x3": 436.73, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.95, "t": 219.16, "r": 199.83, "b": 227.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.95, "r_y0": 227.23, "r_x1": 199.83, "r_y1": 227.23, "r_x2": 199.83, "r_y2": 219.16, "r_x3": 155.95, "r_y3": 219.16, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.44, "t": 213.68, "r": 247.13, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 221.75, "r_x1": 247.13, "r_y1": 221.75, "r_x2": 247.13, "r_y2": 213.68, "r_x3": 222.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.74, "t": 213.68, "r": 285.73, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 221.75, "r_x1": 285.73, "r_y1": 221.75, "r_x2": 285.73, "r_y2": 213.68, "r_x3": 264.74, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.44, "t": 213.68, "r": 323.43, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 221.75, "r_x1": 323.43, "r_y1": 221.75, "r_x2": 323.43, "r_y2": 213.68, "r_x3": 302.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.81, "t": 213.62, "r": 361.98, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 221.55, "r_x1": 361.98, "r_y1": 221.55, "r_x2": 361.98, "r_y2": 213.62, "r_x3": 337.81, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.46, "t": 213.62, "r": 404.62, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 221.55, "r_x1": 404.62, "r_y1": 221.55, "r_x2": 404.62, "r_y2": 213.62, "r_x3": 380.46, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.49, "t": 213.62, "r": 454.35, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 221.55, "r_x1": 454.35, "r_y1": 221.55, "r_x2": 454.35, "r_y2": 213.62, "r_x3": 435.49, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.9, "t": 226.63, "r": 248.67, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.67, "r_y1": 234.7, "r_x2": 248.67, "r_y2": 226.63, "r_x3": 220.9, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.74, "t": 226.63, "r": 285.73, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 234.7, "r_x1": 285.73, "r_y1": 234.7, "r_x2": 285.73, "r_y2": 226.63, "r_x3": 264.74, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.44, "t": 226.63, "r": 323.43, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 234.7, "r_x1": 323.43, "r_y1": 234.7, "r_x2": 323.43, "r_y2": 226.63, "r_x3": 302.44, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.71, "t": 226.63, "r": 358.09, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.71, "r_y0": 234.7, "r_x1": 358.09, "r_y1": 234.7, "r_x2": 358.09, "r_y2": 226.63, "r_x3": 341.71, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.05, "t": 226.63, "r": 403.04, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 234.7, "r_x1": 403.04, "r_y1": 234.7, "r_x2": 403.04, "r_y2": 226.63, "r_x3": 382.05, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.73, "t": 226.63, "r": 453.11, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 234.7, "r_x1": 453.11, "r_y1": 234.7, "r_x2": 453.11, "r_y2": 226.63, "r_x3": 436.73, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.63, "t": 245.46, "r": 207.15, "b": 253.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.63, "r_y0": 253.53, "r_x1": 207.15, "r_y1": 253.53, "r_x2": 207.15, "r_y2": 245.46, "r_x3": 148.63, "r_y3": 245.46, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.44, "t": 239.98, "r": 247.13, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 248.05, "r_x1": 247.13, "r_y1": 248.05, "r_x2": 247.13, "r_y2": 239.98, "r_x3": 222.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.74, "t": 239.98, "r": 285.73, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 248.05, "r_x1": 285.73, "r_y1": 248.05, "r_x2": 285.73, "r_y2": 239.98, "r_x3": 264.74, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.44, "t": 239.98, "r": 323.43, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 248.05, "r_x1": 323.43, "r_y1": 248.05, "r_x2": 323.43, "r_y2": 239.98, "r_x3": 302.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.81, "t": 239.92, "r": 361.98, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 247.85, "r_x1": 361.98, "r_y1": 247.85, "r_x2": 361.98, "r_y2": 239.92, "r_x3": 337.81, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.46, "t": 239.92, "r": 404.62, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 247.85, "r_x1": 404.62, "r_y1": 247.85, "r_x2": 404.62, "r_y2": 239.92, "r_x3": 380.46, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.49, "t": 239.92, "r": 454.35, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 247.85, "r_x1": 454.35, "r_y1": 247.85, "r_x2": 454.35, "r_y2": 239.92, "r_x3": 435.49, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.9, "t": 252.93, "r": 248.67, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.67, "r_y1": 261.0, "r_x2": 248.67, "r_y2": 252.93, "r_x3": 220.9, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.74, "t": 252.93, "r": 285.73, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 261.0, "r_x1": 285.73, "r_y1": 261.0, "r_x2": 285.73, "r_y2": 252.93, "r_x3": 264.74, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.44, "t": 252.93, "r": 323.43, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 261.0, "r_x1": 323.43, "r_y1": 261.0, "r_x2": 323.43, "r_y2": 252.93, "r_x3": 302.44, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.4, "t": 252.93, "r": 360.39, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.39, "r_y1": 261.0, "r_x2": 360.39, "r_y2": 252.93, "r_x3": 339.4, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.05, "t": 252.93, "r": 403.04, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 261.0, "r_x1": 403.04, "r_y1": 261.0, "r_x2": 403.04, "r_y2": 252.93, "r_x3": 382.05, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.73, "t": 252.93, "r": 453.11, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 261.0, "r_x1": 453.11, "r_y1": 261.0, "r_x2": 453.11, "r_y2": 252.93, "r_x3": 436.73, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 7, "table_cells": [ { "bbox": { "l": 160.78, "t": 166.56, "r": 195.0, "b": 174.63, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 215.52, "t": 166.53, "r": 254.04, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 300.4, "t": 161.08, "r": 323.99, "b": 169.15, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 370.35, "t": 166.56, "r": 414.75, "b": 174.63, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 426.74, "t": 161.08, "r": 463.11, "b": 169.15, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 262.41, "t": 174.03, "r": 288.06, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 296.43, "t": 174.03, "r": 329.45, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 345.03, "t": 174.03, "r": 354.76, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 154.54, "t": 192.86, "r": 201.24, "b": 200.93, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.44, "t": 187.38, "r": 247.13, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74, "t": 187.38, "r": 285.73, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.44, "t": 187.38, "r": 323.43, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 339.4, "t": 187.38, "r": 360.39, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 383.12, "t": 187.32, "r": 401.97, "b": 195.24, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49, "t": 187.32, "r": 454.35, "b": 195.24, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 155.95, "t": 219.16, "r": 199.83, "b": 227.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.44, "t": 213.68, "r": 247.13, "b": 221.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74, "t": 213.68, "r": 285.73, "b": 221.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.44, "t": 213.68, "r": 323.43, "b": 221.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.81, "t": 213.62, "r": 361.98, "b": 221.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46, "t": 213.62, "r": 404.62, "b": 221.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49, "t": 213.62, "r": 454.35, "b": 221.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 148.63, "t": 245.46, "r": 207.15, "b": 253.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.44, "t": 239.98, "r": 247.13, "b": 248.05, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74, "t": 239.98, "r": 285.73, "b": 248.05, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.44, "t": 239.98, "r": 323.43, "b": 248.05, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.81, "t": 239.92, "r": 361.98, "b": 247.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46, "t": 239.92, "r": 404.62, "b": 247.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49, "t": 239.92, "r": 454.35, "b": 247.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false } ] } } }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 143.98, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.831, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" }, { "label": "page_header", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.82, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.837, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "caption", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.76, "t": 115.84, "r": 480.59, "b": 145.89, "coord_origin": "TOPLEFT" }, "confidence": 0.951, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 123.76, "r_x1": 173.09, "r_y1": 123.76, "r_x2": 173.09, "r_y2": 115.84, "r_x3": 134.76, "r_y3": 115.84, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.3, "r_y0": 123.97, "r_x1": 480.59, "r_y1": 123.97, "r_x2": 480.59, "r_y2": 115.9, "r_x3": 181.3, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 134.93, "r_x1": 480.59, "r_y1": 134.93, "r_x2": 480.59, "r_y2": 126.86, "r_x3": 134.76, "r_y3": 126.86, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 145.89, "r_x1": 305.96, "r_y1": 145.89, "r_x2": 305.96, "r_y2": 137.82, "r_x3": 134.76, "r_y3": 137.82, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2. TSR and cell detection results compared between OTSL and HTML on the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using TableFormer [9] (with enc=6, dec=6, heads=8)." }, { "label": "table", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "table", "bbox": { "l": 143.64, "t": 156.35, "r": 470.85, "b": 263.26, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.78, "r_y0": 174.63, "r_x1": 195.0, "r_y1": 174.63, "r_x2": 195.0, "r_y2": 166.56, "r_x3": 160.78, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52, "r_y0": 174.6, "r_x1": 254.04, "r_y1": 174.6, "r_x2": 254.04, "r_y2": 166.53, "r_x3": 215.52, "r_y3": 166.53, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.15, "r_x1": 323.99, "r_y1": 169.15, "r_x2": 323.99, "r_y2": 161.08, "r_x3": 300.4, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.35, "r_y0": 174.63, "r_x1": 414.75, "r_y1": 174.63, "r_x2": 414.75, "r_y2": 166.56, "r_x3": 370.35, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.74, "r_y0": 169.15, "r_x1": 463.11, "r_y1": 169.15, "r_x2": 463.11, "r_y2": 161.08, "r_x3": 426.74, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11, "r_y0": 180.11, "r_x1": 466.73, "r_y1": 180.11, "r_x2": 466.73, "r_y2": 172.04, "r_x3": 423.11, "r_y3": 172.04, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41, "r_y0": 182.1, "r_x1": 288.06, "r_y1": 182.1, "r_x2": 288.06, "r_y2": 174.03, "r_x3": 262.41, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.43, "r_y0": 182.1, "r_x1": 329.45, "r_y1": 182.1, "r_x2": 329.45, "r_y2": 174.03, "r_x3": 296.43, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03, "r_y0": 182.1, "r_x1": 354.76, "r_y1": 182.1, "r_x2": 354.76, "r_y2": 174.03, "r_x3": 345.03, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.54, "r_y0": 200.93, "r_x1": 201.24, "r_y1": 200.93, "r_x2": 201.24, "r_y2": 192.86, "r_x3": 154.54, "r_y3": 192.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 195.45, "r_x1": 247.13, "r_y1": 195.45, "r_x2": 247.13, "r_y2": 187.38, "r_x3": 222.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 195.45, "r_x1": 285.73, "r_y1": 195.45, "r_x2": 285.73, "r_y2": 187.38, "r_x3": 264.74, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 195.45, "r_x1": 323.43, "r_y1": 195.45, "r_x2": 323.43, "r_y2": 187.38, "r_x3": 302.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.45, "r_x1": 360.39, "r_y1": 195.45, "r_x2": 360.39, "r_y2": 187.38, "r_x3": 339.4, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.12, "r_y0": 195.24, "r_x1": 401.97, "r_y1": 195.24, "r_x2": 401.97, "r_y2": 187.32, "r_x3": 383.12, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 195.24, "r_x1": 454.35, "r_y1": 195.24, "r_x2": 454.35, "r_y2": 187.32, "r_x3": 435.49, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.67, "r_y1": 208.4, "r_x2": 248.67, "r_y2": 200.33, "r_x3": 220.9, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 208.4, "r_x1": 285.73, "r_y1": 208.4, "r_x2": 285.73, "r_y2": 200.33, "r_x3": 264.74, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 208.4, "r_x1": 323.43, "r_y1": 208.4, "r_x2": 323.43, "r_y2": 200.33, "r_x3": 302.44, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.39, "r_y1": 208.4, "r_x2": 360.39, "r_y2": 200.33, "r_x3": 339.4, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 208.4, "r_x1": 403.04, "r_y1": 208.4, "r_x2": 403.04, "r_y2": 200.33, "r_x3": 382.05, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 208.4, "r_x1": 453.11, "r_y1": 208.4, "r_x2": 453.11, "r_y2": 200.33, "r_x3": 436.73, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.95, "r_y0": 227.23, "r_x1": 199.83, "r_y1": 227.23, "r_x2": 199.83, "r_y2": 219.16, "r_x3": 155.95, "r_y3": 219.16, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 221.75, "r_x1": 247.13, "r_y1": 221.75, "r_x2": 247.13, "r_y2": 213.68, "r_x3": 222.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 221.75, "r_x1": 285.73, "r_y1": 221.75, "r_x2": 285.73, "r_y2": 213.68, "r_x3": 264.74, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 221.75, "r_x1": 323.43, "r_y1": 221.75, "r_x2": 323.43, "r_y2": 213.68, "r_x3": 302.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 221.55, "r_x1": 361.98, "r_y1": 221.55, "r_x2": 361.98, "r_y2": 213.62, "r_x3": 337.81, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 221.55, "r_x1": 404.62, "r_y1": 221.55, "r_x2": 404.62, "r_y2": 213.62, "r_x3": 380.46, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 221.55, "r_x1": 454.35, "r_y1": 221.55, "r_x2": 454.35, "r_y2": 213.62, "r_x3": 435.49, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.67, "r_y1": 234.7, "r_x2": 248.67, "r_y2": 226.63, "r_x3": 220.9, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 234.7, "r_x1": 285.73, "r_y1": 234.7, "r_x2": 285.73, "r_y2": 226.63, "r_x3": 264.74, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 234.7, "r_x1": 323.43, "r_y1": 234.7, "r_x2": 323.43, "r_y2": 226.63, "r_x3": 302.44, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.71, "r_y0": 234.7, "r_x1": 358.09, "r_y1": 234.7, "r_x2": 358.09, "r_y2": 226.63, "r_x3": 341.71, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 234.7, "r_x1": 403.04, "r_y1": 234.7, "r_x2": 403.04, "r_y2": 226.63, "r_x3": 382.05, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 234.7, "r_x1": 453.11, "r_y1": 234.7, "r_x2": 453.11, "r_y2": 226.63, "r_x3": 436.73, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.63, "r_y0": 253.53, "r_x1": 207.15, "r_y1": 253.53, "r_x2": 207.15, "r_y2": 245.46, "r_x3": 148.63, "r_y3": 245.46, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 248.05, "r_x1": 247.13, "r_y1": 248.05, "r_x2": 247.13, "r_y2": 239.98, "r_x3": 222.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 248.05, "r_x1": 285.73, "r_y1": 248.05, "r_x2": 285.73, "r_y2": 239.98, "r_x3": 264.74, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 248.05, "r_x1": 323.43, "r_y1": 248.05, "r_x2": 323.43, "r_y2": 239.98, "r_x3": 302.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 247.85, "r_x1": 361.98, "r_y1": 247.85, "r_x2": 361.98, "r_y2": 239.92, "r_x3": 337.81, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 247.85, "r_x1": 404.62, "r_y1": 247.85, "r_x2": 404.62, "r_y2": 239.92, "r_x3": 380.46, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 247.85, "r_x1": 454.35, "r_y1": 247.85, "r_x2": 454.35, "r_y2": 239.92, "r_x3": 435.49, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.67, "r_y1": 261.0, "r_x2": 248.67, "r_y2": 252.93, "r_x3": 220.9, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 261.0, "r_x1": 285.73, "r_y1": 261.0, "r_x2": 285.73, "r_y2": 252.93, "r_x3": 264.74, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 261.0, "r_x1": 323.43, "r_y1": 261.0, "r_x2": 323.43, "r_y2": 252.93, "r_x3": 302.44, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.39, "r_y1": 261.0, "r_x2": 360.39, "r_y2": 252.93, "r_x3": 339.4, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 261.0, "r_x1": 403.04, "r_y1": 261.0, "r_x2": 403.04, "r_y2": 252.93, "r_x3": 382.05, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 261.0, "r_x1": 453.11, "r_y1": 261.0, "r_x2": 453.11, "r_y2": 252.93, "r_x3": 436.73, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.78, "t": 166.56, "r": 195.0, "b": 174.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.78, "r_y0": 174.63, "r_x1": 195.0, "r_y1": 174.63, "r_x2": 195.0, "r_y2": 166.56, "r_x3": 160.78, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.52, "t": 166.53, "r": 254.04, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52, "r_y0": 174.6, "r_x1": 254.04, "r_y1": 174.6, "r_x2": 254.04, "r_y2": 166.53, "r_x3": 215.52, "r_y3": 166.53, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.4, "t": 161.08, "r": 323.99, "b": 169.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.15, "r_x1": 323.99, "r_y1": 169.15, "r_x2": 323.99, "r_y2": 161.08, "r_x3": 300.4, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.35, "t": 166.56, "r": 414.75, "b": 174.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.35, "r_y0": 174.63, "r_x1": 414.75, "r_y1": 174.63, "r_x2": 414.75, "r_y2": 166.56, "r_x3": 370.35, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.74, "t": 161.08, "r": 463.11, "b": 169.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.74, "r_y0": 169.15, "r_x1": 463.11, "r_y1": 169.15, "r_x2": 463.11, "r_y2": 161.08, "r_x3": 426.74, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.11, "t": 172.04, "r": 466.73, "b": 180.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11, "r_y0": 180.11, "r_x1": 466.73, "r_y1": 180.11, "r_x2": 466.73, "r_y2": 172.04, "r_x3": 423.11, "r_y3": 172.04, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.41, "t": 174.03, "r": 288.06, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41, "r_y0": 182.1, "r_x1": 288.06, "r_y1": 182.1, "r_x2": 288.06, "r_y2": 174.03, "r_x3": 262.41, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.43, "t": 174.03, "r": 329.45, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.43, "r_y0": 182.1, "r_x1": 329.45, "r_y1": 182.1, "r_x2": 329.45, "r_y2": 174.03, "r_x3": 296.43, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.03, "t": 174.03, "r": 354.76, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03, "r_y0": 182.1, "r_x1": 354.76, "r_y1": 182.1, "r_x2": 354.76, "r_y2": 174.03, "r_x3": 345.03, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.54, "t": 192.86, "r": 201.24, "b": 200.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.54, "r_y0": 200.93, "r_x1": 201.24, "r_y1": 200.93, "r_x2": 201.24, "r_y2": 192.86, "r_x3": 154.54, "r_y3": 192.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.44, "t": 187.38, "r": 247.13, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 195.45, "r_x1": 247.13, "r_y1": 195.45, "r_x2": 247.13, "r_y2": 187.38, "r_x3": 222.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.74, "t": 187.38, "r": 285.73, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 195.45, "r_x1": 285.73, "r_y1": 195.45, "r_x2": 285.73, "r_y2": 187.38, "r_x3": 264.74, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.44, "t": 187.38, "r": 323.43, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 195.45, "r_x1": 323.43, "r_y1": 195.45, "r_x2": 323.43, "r_y2": 187.38, "r_x3": 302.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.4, "t": 187.38, "r": 360.39, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.45, "r_x1": 360.39, "r_y1": 195.45, "r_x2": 360.39, "r_y2": 187.38, "r_x3": 339.4, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.12, "t": 187.32, "r": 401.97, "b": 195.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.12, "r_y0": 195.24, "r_x1": 401.97, "r_y1": 195.24, "r_x2": 401.97, "r_y2": 187.32, "r_x3": 383.12, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.49, "t": 187.32, "r": 454.35, "b": 195.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 195.24, "r_x1": 454.35, "r_y1": 195.24, "r_x2": 454.35, "r_y2": 187.32, "r_x3": 435.49, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.9, "t": 200.33, "r": 248.67, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.67, "r_y1": 208.4, "r_x2": 248.67, "r_y2": 200.33, "r_x3": 220.9, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.74, "t": 200.33, "r": 285.73, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 208.4, "r_x1": 285.73, "r_y1": 208.4, "r_x2": 285.73, "r_y2": 200.33, "r_x3": 264.74, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.44, "t": 200.33, "r": 323.43, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 208.4, "r_x1": 323.43, "r_y1": 208.4, "r_x2": 323.43, "r_y2": 200.33, "r_x3": 302.44, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.4, "t": 200.33, "r": 360.39, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.39, "r_y1": 208.4, "r_x2": 360.39, "r_y2": 200.33, "r_x3": 339.4, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.05, "t": 200.33, "r": 403.04, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 208.4, "r_x1": 403.04, "r_y1": 208.4, "r_x2": 403.04, "r_y2": 200.33, "r_x3": 382.05, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.73, "t": 200.33, "r": 453.11, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 208.4, "r_x1": 453.11, "r_y1": 208.4, "r_x2": 453.11, "r_y2": 200.33, "r_x3": 436.73, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.95, "t": 219.16, "r": 199.83, "b": 227.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.95, "r_y0": 227.23, "r_x1": 199.83, "r_y1": 227.23, "r_x2": 199.83, "r_y2": 219.16, "r_x3": 155.95, "r_y3": 219.16, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.44, "t": 213.68, "r": 247.13, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 221.75, "r_x1": 247.13, "r_y1": 221.75, "r_x2": 247.13, "r_y2": 213.68, "r_x3": 222.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.74, "t": 213.68, "r": 285.73, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 221.75, "r_x1": 285.73, "r_y1": 221.75, "r_x2": 285.73, "r_y2": 213.68, "r_x3": 264.74, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.44, "t": 213.68, "r": 323.43, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 221.75, "r_x1": 323.43, "r_y1": 221.75, "r_x2": 323.43, "r_y2": 213.68, "r_x3": 302.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.81, "t": 213.62, "r": 361.98, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 221.55, "r_x1": 361.98, "r_y1": 221.55, "r_x2": 361.98, "r_y2": 213.62, "r_x3": 337.81, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.46, "t": 213.62, "r": 404.62, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 221.55, "r_x1": 404.62, "r_y1": 221.55, "r_x2": 404.62, "r_y2": 213.62, "r_x3": 380.46, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.49, "t": 213.62, "r": 454.35, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 221.55, "r_x1": 454.35, "r_y1": 221.55, "r_x2": 454.35, "r_y2": 213.62, "r_x3": 435.49, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.9, "t": 226.63, "r": 248.67, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.67, "r_y1": 234.7, "r_x2": 248.67, "r_y2": 226.63, "r_x3": 220.9, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.74, "t": 226.63, "r": 285.73, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 234.7, "r_x1": 285.73, "r_y1": 234.7, "r_x2": 285.73, "r_y2": 226.63, "r_x3": 264.74, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.44, "t": 226.63, "r": 323.43, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 234.7, "r_x1": 323.43, "r_y1": 234.7, "r_x2": 323.43, "r_y2": 226.63, "r_x3": 302.44, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.71, "t": 226.63, "r": 358.09, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.71, "r_y0": 234.7, "r_x1": 358.09, "r_y1": 234.7, "r_x2": 358.09, "r_y2": 226.63, "r_x3": 341.71, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.05, "t": 226.63, "r": 403.04, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 234.7, "r_x1": 403.04, "r_y1": 234.7, "r_x2": 403.04, "r_y2": 226.63, "r_x3": 382.05, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.73, "t": 226.63, "r": 453.11, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 234.7, "r_x1": 453.11, "r_y1": 234.7, "r_x2": 453.11, "r_y2": 226.63, "r_x3": 436.73, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.63, "t": 245.46, "r": 207.15, "b": 253.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.63, "r_y0": 253.53, "r_x1": 207.15, "r_y1": 253.53, "r_x2": 207.15, "r_y2": 245.46, "r_x3": 148.63, "r_y3": 245.46, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.44, "t": 239.98, "r": 247.13, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 248.05, "r_x1": 247.13, "r_y1": 248.05, "r_x2": 247.13, "r_y2": 239.98, "r_x3": 222.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.74, "t": 239.98, "r": 285.73, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 248.05, "r_x1": 285.73, "r_y1": 248.05, "r_x2": 285.73, "r_y2": 239.98, "r_x3": 264.74, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.44, "t": 239.98, "r": 323.43, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 248.05, "r_x1": 323.43, "r_y1": 248.05, "r_x2": 323.43, "r_y2": 239.98, "r_x3": 302.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.81, "t": 239.92, "r": 361.98, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 247.85, "r_x1": 361.98, "r_y1": 247.85, "r_x2": 361.98, "r_y2": 239.92, "r_x3": 337.81, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.46, "t": 239.92, "r": 404.62, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 247.85, "r_x1": 404.62, "r_y1": 247.85, "r_x2": 404.62, "r_y2": 239.92, "r_x3": 380.46, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.49, "t": 239.92, "r": 454.35, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 247.85, "r_x1": 454.35, "r_y1": 247.85, "r_x2": 454.35, "r_y2": 239.92, "r_x3": 435.49, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.9, "t": 252.93, "r": 248.67, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.67, "r_y1": 261.0, "r_x2": 248.67, "r_y2": 252.93, "r_x3": 220.9, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.74, "t": 252.93, "r": 285.73, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 261.0, "r_x1": 285.73, "r_y1": 261.0, "r_x2": 285.73, "r_y2": 252.93, "r_x3": 264.74, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.44, "t": 252.93, "r": 323.43, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 261.0, "r_x1": 323.43, "r_y1": 261.0, "r_x2": 323.43, "r_y2": 252.93, "r_x3": 302.44, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.4, "t": 252.93, "r": 360.39, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.39, "r_y1": 261.0, "r_x2": 360.39, "r_y2": 252.93, "r_x3": 339.4, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.05, "t": 252.93, "r": 403.04, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 261.0, "r_x1": 403.04, "r_y1": 261.0, "r_x2": 403.04, "r_y2": 252.93, "r_x3": 382.05, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.73, "t": 252.93, "r": 453.11, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 261.0, "r_x1": 453.11, "r_y1": 261.0, "r_x2": 453.11, "r_y2": 252.93, "r_x3": 436.73, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 7, "table_cells": [ { "bbox": { "l": 160.78, "t": 166.56, "r": 195.0, "b": 174.63, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 215.52, "t": 166.53, "r": 254.04, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 300.4, "t": 161.08, "r": 323.99, "b": 169.15, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 370.35, "t": 166.56, "r": 414.75, "b": 174.63, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 426.74, "t": 161.08, "r": 463.11, "b": 169.15, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 262.41, "t": 174.03, "r": 288.06, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 296.43, "t": 174.03, "r": 329.45, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 345.03, "t": 174.03, "r": 354.76, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 154.54, "t": 192.86, "r": 201.24, "b": 200.93, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.44, "t": 187.38, "r": 247.13, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74, "t": 187.38, "r": 285.73, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.44, "t": 187.38, "r": 323.43, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 339.4, "t": 187.38, "r": 360.39, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 383.12, "t": 187.32, "r": 401.97, "b": 195.24, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49, "t": 187.32, "r": 454.35, "b": 195.24, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 155.95, "t": 219.16, "r": 199.83, "b": 227.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.44, "t": 213.68, "r": 247.13, "b": 221.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74, "t": 213.68, "r": 285.73, "b": 221.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.44, "t": 213.68, "r": 323.43, "b": 221.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.81, "t": 213.62, "r": 361.98, "b": 221.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46, "t": 213.62, "r": 404.62, "b": 221.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49, "t": 213.62, "r": 454.35, "b": 221.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 148.63, "t": 245.46, "r": 207.15, "b": 253.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.44, "t": 239.98, "r": 247.13, "b": 248.05, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74, "t": 239.98, "r": 285.73, "b": 248.05, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.44, "t": 239.98, "r": 323.43, "b": 248.05, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.81, "t": 239.92, "r": 361.98, "b": 247.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46, "t": 239.92, "r": 404.62, "b": 247.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49, "t": 239.92, "r": 454.35, "b": 247.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76, "t": 288.91, "r": 257.09, "b": 297.72, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 297.72, "r_x1": 149.4, "r_y1": 297.72, "r_x2": 149.4, "r_y2": 288.91, "r_x3": 134.76, "r_y3": 288.91, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 297.72, "r_x1": 257.09, "r_y1": 297.72, "r_x2": 257.09, "r_y2": 288.91, "r_x3": 160.86, "r_y3": 288.91, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3 Qualitative Results" }, { "label": "text", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 309.86, "r": 480.59, "b": 366.48, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 318.66, "r_x1": 480.59, "r_y1": 318.66, "r_x2": 480.59, "r_y2": 309.86, "r_x3": 134.76, "r_y3": 309.86, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 330.61, "r_x1": 480.59, "r_y1": 330.61, "r_x2": 480.59, "r_y2": 321.82, "r_x3": 134.76, "r_y3": 321.82, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 342.57, "r_x1": 480.59, "r_y1": 342.57, "r_x2": 480.59, "r_y2": 333.77, "r_x3": 134.76, "r_y3": 333.77, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 354.52, "r_x1": 480.59, "r_y1": 354.52, "r_x2": 480.59, "r_y2": 345.73, "r_x3": 134.76, "r_y3": 345.73, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 366.48, "r_x1": 161.66, "r_y1": 366.48, "r_x2": 161.66, "r_y2": 357.68, "r_x3": 134.76, "r_y3": 357.68, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5 demonstrates less overlap and more accurate bounding boxes with OTSL. In Figure 6, OTSL proves to be more effective in handling tables with longer token sequences, resulting in even more precise structure prediction and bounding boxes." }, { "label": "caption", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 134.76, "t": 397.59, "r": 480.59, "b": 439.72, "coord_origin": "TOPLEFT" }, "confidence": 0.948, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 405.52, "r_x1": 162.64, "r_y1": 405.52, "r_x2": 162.64, "r_y2": 397.59, "r_x3": 134.76, "r_y3": 397.59, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38, "r_y0": 405.72, "r_x1": 480.59, "r_y1": 405.72, "r_x2": 480.59, "r_y2": 397.65, "r_x3": 167.38, "r_y3": 397.65, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 416.68, "r_x1": 480.59, "r_y1": 416.68, "r_x2": 480.59, "r_y2": 408.61, "r_x3": 134.76, "r_y3": 408.61, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 427.64, "r_x1": 480.59, "r_y1": 427.64, "r_x2": 480.59, "r_y2": 419.57, "r_x3": 134.76, "r_y3": 419.57, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 438.6, "r_x1": 304.69, "r_y1": 438.6, "r_x2": 304.69, "r_y2": 430.53, "r_x3": 134.76, "r_y3": 430.53, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.63, "r_y0": 439.72, "r_x1": 344.82, "r_y1": 439.72, "r_x2": 344.82, "r_y2": 430.2, "r_x3": 342.63, "r_y3": 430.2, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 5. The OTSL model produces more accurate bounding boxes with less overlap (E) than the HTML model (D), when predicting the structure of a sparse table (A), at twice the inference speed because of shorter sequence length (B),(C). \"PMC2807444_006_00.png\" PubTabNet. \u03bc" }, { "label": "picture", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 162.67, "t": 444.62, "r": 451.7, "b": 663.21, "coord_origin": "TOPLEFT" }, "confidence": 0.974, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 518.95, "r_x1": 190.62, "r_y1": 518.95, "r_x2": 190.62, "r_y2": 516.23, "r_x3": 180.12, "r_y3": 516.23, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 522.85, "r_x1": 304.55, "r_y1": 522.85, "r_x2": 304.55, "r_y2": 520.13, "r_x3": 183.24, "r_y3": 520.13, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 526.75, "r_x1": 388.42, "r_y1": 526.75, "r_x2": 388.42, "r_y2": 524.03, "r_x3": 183.24, "r_y3": 524.03, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 530.65, "r_x1": 388.42, "r_y1": 530.65, "r_x2": 388.42, "r_y2": 527.93, "r_x3": 183.24, "r_y3": 527.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 534.55, "r_x1": 388.42, "r_y1": 534.55, "r_x2": 388.42, "r_y2": 531.83, "r_x3": 183.24, "r_y3": 531.83, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 538.44, "r_x1": 388.42, "r_y1": 538.44, "r_x2": 388.42, "r_y2": 535.73, "r_x3": 183.24, "r_y3": 535.73, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 542.34, "r_x1": 388.42, "r_y1": 542.34, "r_x2": 388.42, "r_y2": 539.63, "r_x3": 183.24, "r_y3": 539.63, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 546.24, "r_x1": 388.42, "r_y1": 546.24, "r_x2": 388.42, "r_y2": 543.53, "r_x3": 183.24, "r_y3": 543.53, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 550.14, "r_x1": 388.42, "r_y1": 550.14, "r_x2": 388.42, "r_y2": 547.42, "r_x3": 183.24, "r_y3": 547.42, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 554.04, "r_x1": 388.42, "r_y1": 554.04, "r_x2": 388.42, "r_y2": 551.32, "r_x3": 183.24, "r_y3": 551.32, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 557.94, "r_x1": 191.87, "r_y1": 557.94, "r_x2": 191.87, "r_y2": 555.22, "r_x3": 180.12, "r_y3": 555.22, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 521.02, "r_x1": 408.82, "r_y1": 521.02, "r_x2": 408.82, "r_y2": 518.3, "r_x3": 407.38, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 521.02, "r_x1": 450.49, "r_y1": 521.02, "r_x2": 450.49, "r_y2": 518.3, "r_x3": 410.26, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 524.92, "r_x1": 408.82, "r_y1": 524.92, "r_x2": 408.82, "r_y2": 522.2, "r_x3": 407.38, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 524.92, "r_x1": 450.49, "r_y1": 524.92, "r_x2": 450.49, "r_y2": 522.2, "r_x3": 410.26, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 528.81, "r_x1": 408.82, "r_y1": 528.81, "r_x2": 408.82, "r_y2": 526.1, "r_x3": 407.38, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 528.81, "r_x1": 450.49, "r_y1": 528.81, "r_x2": 450.49, "r_y2": 526.1, "r_x3": 410.26, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 532.71, "r_x1": 408.82, "r_y1": 532.71, "r_x2": 408.82, "r_y2": 530.0, "r_x3": 407.38, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 532.71, "r_x1": 450.49, "r_y1": 532.71, "r_x2": 450.49, "r_y2": 530.0, "r_x3": 410.26, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 536.61, "r_x1": 408.82, "r_y1": 536.61, "r_x2": 408.82, "r_y2": 533.9, "r_x3": 407.38, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 536.61, "r_x1": 450.49, "r_y1": 536.61, "r_x2": 450.49, "r_y2": 533.9, "r_x3": 410.26, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 540.51, "r_x1": 408.82, "r_y1": 540.51, "r_x2": 408.82, "r_y2": 537.79, "r_x3": 407.38, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 540.51, "r_x1": 450.49, "r_y1": 540.51, "r_x2": 450.49, "r_y2": 537.79, "r_x3": 410.26, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 544.41, "r_x1": 408.82, "r_y1": 544.41, "r_x2": 408.82, "r_y2": 541.69, "r_x3": 407.38, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 544.41, "r_x1": 450.49, "r_y1": 544.41, "r_x2": 450.49, "r_y2": 541.69, "r_x3": 410.26, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 548.31, "r_x1": 408.82, "r_y1": 548.31, "r_x2": 408.82, "r_y2": 545.59, "r_x3": 407.38, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 548.31, "r_x1": 450.49, "r_y1": 548.31, "r_x2": 450.49, "r_y2": 545.59, "r_x3": 410.26, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 552.21, "r_x1": 408.82, "r_y1": 552.21, "r_x2": 408.82, "r_y2": 549.49, "r_x3": 407.38, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 552.21, "r_x1": 450.49, "r_y1": 552.21, "r_x2": 450.49, "r_y2": 549.49, "r_x3": 410.26, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.53, "r_y0": 515.31, "r_x1": 181.85, "r_y1": 515.31, "r_x2": 181.85, "r_y2": 509.46, "r_x3": 164.53, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58, "r_y0": 515.31, "r_x1": 186.4, "r_y1": 515.31, "r_x2": 186.4, "r_y2": 509.46, "r_x3": 183.58, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.21, "r_y0": 515.31, "r_x1": 208.9, "r_y1": 515.31, "r_x2": 208.9, "r_y2": 509.46, "r_x3": 189.21, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63, "r_y0": 515.31, "r_x1": 221.04, "r_y1": 515.31, "r_x2": 221.04, "r_y2": 509.46, "r_x3": 210.63, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.46, "r_x1": 406.84, "r_y1": 515.46, "r_x2": 406.84, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.57, "r_y0": 515.46, "r_x1": 411.38, "r_y1": 515.46, "r_x2": 411.38, "r_y2": 509.6, "r_x3": 408.57, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.46, "r_x1": 433.89, "r_y1": 515.46, "r_x2": 433.89, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.62, "r_y0": 515.46, "r_x1": 446.03, "r_y1": 515.46, "r_x2": 446.03, "r_y2": 509.6, "r_x3": 435.62, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19, "r_y0": 526.39, "r_x1": 172.82, "r_y1": 526.39, "r_x2": 172.82, "r_y2": 519.07, "r_x3": 167.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.34, "r_y0": 455.94, "r_x1": 192.97, "r_y1": 455.94, "r_x2": 192.97, "r_y2": 448.62, "r_x3": 187.34, "r_y3": 448.62, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.39, "r_y0": 573.32, "r_x1": 173.02, "r_y1": 573.32, "r_x2": 173.02, "r_y2": 566.01, "r_x3": 167.39, "r_y3": 566.01, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.46, "r_y0": 629.09, "r_x1": 253.66, "r_y1": 629.09, "r_x2": 253.66, "r_y2": 621.78, "r_x3": 248.46, "r_y3": 621.78, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.51, "r_x1": 401.53, "r_y1": 526.51, "r_x2": 401.53, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.63, "r_y0": 597.27, "r_x1": 177.48, "r_y1": 597.27, "r_x2": 177.48, "r_y2": 580.29, "r_x3": 171.63, "r_y3": 580.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.06, "r_y0": 649.92, "r_x1": 256.91, "r_y1": 649.92, "r_x2": 256.91, "r_y2": 633.63, "r_x3": 251.06, "r_y3": 633.63, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 607.31, "r_x1": 427.04, "r_y1": 607.31, "r_x2": 427.04, "r_y2": 601.46, "r_x3": 372.15, "r_y3": 601.46, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 613.75, "r_x1": 430.07, "r_y1": 613.75, "r_x2": 430.07, "r_y2": 607.9, "r_x3": 372.15, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 648.72, "r_x1": 231.08, "r_y1": 648.72, "r_x2": 231.08, "r_y2": 642.87, "r_x3": 176.88, "r_y3": 642.87, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 655.17, "r_x1": 230.99, "r_y1": 655.17, "r_x2": 230.99, "r_y2": 649.31, "r_x3": 176.88, "r_y3": 649.31, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 661.61, "r_x1": 203.93, "r_y1": 661.61, "r_x2": 203.93, "r_y2": 655.76, "r_x3": 176.88, "r_y3": 655.76, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.56, "r_x3": 215.93, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.06, "r_y0": 569.16, "r_x1": 231.72, "r_y1": 569.16, "r_x2": 231.72, "r_y2": 557.56, "r_x3": 229.06, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.21, "r_y0": 451.2, "r_x1": 263.57, "r_y1": 451.2, "r_x2": 263.57, "r_y2": 448.46, "r_x3": 261.21, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33, "r_y0": 451.2, "r_x1": 313.64, "r_y1": 451.2, "r_x2": 313.64, "r_y2": 448.46, "r_x3": 312.33, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41, "r_y0": 451.2, "r_x1": 380.06, "r_y1": 451.2, "r_x2": 380.06, "r_y2": 448.46, "r_x3": 377.41, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 456.08, "r_x1": 205.82, "r_y1": 456.08, "r_x2": 205.82, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.21, "r_y0": 456.08, "r_x1": 229.77, "r_y1": 456.08, "r_x2": 229.77, "r_y2": 453.34, "r_x3": 222.21, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.27, "r_y0": 456.08, "r_x1": 250.83, "r_y1": 456.08, "r_x2": 250.83, "r_y2": 453.34, "r_x3": 243.27, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.08, "r_x1": 271.85, "r_y1": 456.08, "r_x2": 271.85, "r_y2": 453.34, "r_x3": 264.3, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.32, "r_y0": 456.08, "r_x1": 292.88, "r_y1": 456.08, "r_x2": 292.88, "r_y2": 453.34, "r_x3": 285.32, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.38, "r_y0": 456.08, "r_x1": 311.77, "r_y1": 456.08, "r_x2": 311.77, "r_y2": 453.34, "r_x3": 306.38, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.42, "r_y0": 456.08, "r_x1": 325.58, "r_y1": 456.08, "r_x2": 325.58, "r_y2": 453.34, "r_x3": 323.42, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.46, "r_y0": 456.08, "r_x1": 336.62, "r_y1": 456.08, "r_x2": 336.62, "r_y2": 453.34, "r_x3": 334.46, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.53, "r_y0": 456.08, "r_x1": 347.69, "r_y1": 456.08, "r_x2": 347.69, "r_y2": 453.34, "r_x3": 345.53, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.57, "r_y0": 456.08, "r_x1": 358.73, "r_y1": 456.08, "r_x2": 358.73, "r_y2": 453.34, "r_x3": 356.57, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.64, "r_y0": 456.08, "r_x1": 371.97, "r_y1": 456.08, "r_x2": 371.97, "r_y2": 453.34, "r_x3": 367.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.67, "r_y0": 456.08, "r_x1": 387.01, "r_y1": 456.08, "r_x2": 387.01, "r_y2": 453.34, "r_x3": 382.67, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.74, "r_y0": 456.08, "r_x1": 402.07, "r_y1": 456.08, "r_x2": 402.07, "r_y2": 453.34, "r_x3": 397.74, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 457.8, "r_x1": 414.93, "r_y1": 457.8, "r_x2": 414.93, "r_y2": 447.99, "r_x3": 412.79, "r_y3": 447.99, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.96, "r_y0": 456.08, "r_x1": 422.52, "r_y1": 456.08, "r_x2": 422.52, "r_y2": 453.34, "r_x3": 414.96, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.58, "r_y1": 466.66, "r_x2": 204.58, "r_y2": 463.92, "r_x3": 200.64, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.92, "r_x3": 367.63, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 466.66, "r_x1": 384.62, "r_y1": 466.66, "r_x2": 384.62, "r_y2": 463.92, "r_x3": 382.66, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 466.66, "r_x1": 399.68, "r_y1": 466.66, "r_x2": 399.68, "r_y2": 463.92, "r_x3": 397.73, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.54, "r_x1": 206.52, "r_y1": 471.54, "r_x2": 206.52, "r_y2": 468.8, "r_x3": 200.64, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 471.54, "r_x1": 266.26, "r_y1": 471.54, "r_x2": 266.26, "r_y2": 468.8, "r_x3": 264.29, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37, "r_y0": 471.54, "r_x1": 308.34, "r_y1": 471.54, "r_x2": 308.34, "r_y2": 468.8, "r_x3": 306.37, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52, "r_y0": 471.54, "r_x1": 347.48, "r_y1": 471.54, "r_x2": 347.48, "r_y2": 468.8, "r_x3": 345.52, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56, "r_y0": 471.54, "r_x1": 358.52, "r_y1": 471.54, "r_x2": 358.52, "r_y2": 468.8, "r_x3": 356.56, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 471.54, "r_x1": 369.59, "r_y1": 471.54, "r_x2": 369.59, "r_y2": 468.8, "r_x3": 367.63, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 471.54, "r_x1": 384.63, "r_y1": 471.54, "r_x2": 384.63, "r_y2": 468.8, "r_x3": 382.66, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.42, "r_x1": 206.52, "r_y1": 476.42, "r_x2": 206.52, "r_y2": 473.68, "r_x3": 200.64, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 476.42, "r_x1": 266.26, "r_y1": 476.42, "r_x2": 266.26, "r_y2": 473.68, "r_x3": 264.29, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.27, "r_x1": 206.52, "r_y1": 481.27, "r_x2": 206.52, "r_y2": 478.53, "r_x3": 200.64, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26, "r_y0": 481.27, "r_x1": 245.23, "r_y1": 481.27, "r_x2": 245.23, "r_y2": 478.53, "r_x3": 243.26, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 481.27, "r_x1": 266.26, "r_y1": 481.27, "r_x2": 266.26, "r_y2": 478.53, "r_x3": 264.29, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.27, "r_x1": 325.37, "r_y1": 481.27, "r_x2": 325.37, "r_y2": 478.53, "r_x3": 323.4, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 481.27, "r_x1": 399.69, "r_y1": 481.27, "r_x2": 399.69, "r_y2": 478.53, "r_x3": 397.73, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.15, "r_x1": 206.52, "r_y1": 486.15, "r_x2": 206.52, "r_y2": 483.41, "r_x3": 200.64, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 486.15, "r_x1": 384.62, "r_y1": 486.15, "r_x2": 384.62, "r_y2": 483.41, "r_x3": 382.66, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 486.15, "r_x1": 401.65, "r_y1": 486.15, "r_x2": 401.65, "r_y2": 483.41, "r_x3": 397.73, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 486.15, "r_x1": 414.74, "r_y1": 486.15, "r_x2": 414.74, "r_y2": 483.41, "r_x3": 412.79, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 491.03, "r_x1": 207.14, "r_y1": 491.03, "r_x2": 207.14, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 491.03, "r_x1": 369.78, "r_y1": 491.03, "r_x2": 369.78, "r_y2": 488.29, "r_x3": 367.63, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 491.03, "r_x1": 384.82, "r_y1": 491.03, "r_x2": 384.82, "r_y2": 488.29, "r_x3": 382.66, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 491.03, "r_x1": 402.05, "r_y1": 491.03, "r_x2": 402.05, "r_y2": 488.29, "r_x3": 397.73, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 495.9, "r_x1": 208.49, "r_y1": 495.9, "r_x2": 208.49, "r_y2": 493.17, "r_x3": 200.64, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 495.9, "r_x1": 266.26, "r_y1": 495.9, "r_x2": 266.26, "r_y2": 493.17, "r_x3": 264.29, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 58, "label": "text", "bbox": { "l": 180.12, "t": 516.23, "r": 190.62, "b": 518.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 518.95, "r_x1": 190.62, "r_y1": 518.95, "r_x2": 190.62, "r_y2": 516.23, "r_x3": 180.12, "r_y3": 516.23, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 183.24, "t": 520.13, "r": 304.55, "b": 522.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 522.85, "r_x1": 304.55, "r_y1": 522.85, "r_x2": 304.55, "r_y2": 520.13, "r_x3": 183.24, "r_y3": 520.13, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.24, "t": 524.03, "r": 388.42, "b": 526.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 526.75, "r_x1": 388.42, "r_y1": 526.75, "r_x2": 388.42, "r_y2": 524.03, "r_x3": 183.24, "r_y3": 524.03, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 183.24, "t": 527.93, "r": 388.42, "b": 530.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 530.65, "r_x1": 388.42, "r_y1": 530.65, "r_x2": 388.42, "r_y2": 527.93, "r_x3": 183.24, "r_y3": 527.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 183.24, "t": 531.83, "r": 388.42, "b": 534.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 534.55, "r_x1": 388.42, "r_y1": 534.55, "r_x2": 388.42, "r_y2": 531.83, "r_x3": 183.24, "r_y3": 531.83, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 183.24, "t": 535.73, "r": 388.42, "b": 538.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 538.44, "r_x1": 388.42, "r_y1": 538.44, "r_x2": 388.42, "r_y2": 535.73, "r_x3": 183.24, "r_y3": 535.73, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 183.24, "t": 539.63, "r": 388.42, "b": 542.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 542.34, "r_x1": 388.42, "r_y1": 542.34, "r_x2": 388.42, "r_y2": 539.63, "r_x3": 183.24, "r_y3": 539.63, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 183.24, "t": 543.53, "r": 388.42, "b": 546.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 546.24, "r_x1": 388.42, "r_y1": 546.24, "r_x2": 388.42, "r_y2": 543.53, "r_x3": 183.24, "r_y3": 543.53, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 183.24, "t": 547.42, "r": 388.42, "b": 550.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 550.14, "r_x1": 388.42, "r_y1": 550.14, "r_x2": 388.42, "r_y2": 547.42, "r_x3": 183.24, "r_y3": 547.42, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.24, "t": 551.32, "r": 388.42, "b": 554.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 554.04, "r_x1": 388.42, "r_y1": 554.04, "r_x2": 388.42, "r_y2": 551.32, "r_x3": 183.24, "r_y3": 551.32, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 180.12, "t": 555.22, "r": 191.87, "b": 557.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 557.94, "r_x1": 191.87, "r_y1": 557.94, "r_x2": 191.87, "r_y2": 555.22, "r_x3": 180.12, "r_y3": 555.22, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 407.38, "t": 518.3, "r": 408.82, "b": 521.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 521.02, "r_x1": 408.82, "r_y1": 521.02, "r_x2": 408.82, "r_y2": 518.3, "r_x3": 407.38, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 410.26, "t": 518.3, "r": 450.49, "b": 521.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 521.02, "r_x1": 450.49, "r_y1": 521.02, "r_x2": 450.49, "r_y2": 518.3, "r_x3": 410.26, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 407.38, "t": 522.2, "r": 408.82, "b": 524.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 524.92, "r_x1": 408.82, "r_y1": 524.92, "r_x2": 408.82, "r_y2": 522.2, "r_x3": 407.38, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 410.26, "t": 522.2, "r": 450.49, "b": 524.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 524.92, "r_x1": 450.49, "r_y1": 524.92, "r_x2": 450.49, "r_y2": 522.2, "r_x3": 410.26, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 407.38, "t": 526.1, "r": 408.82, "b": 528.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 528.81, "r_x1": 408.82, "r_y1": 528.81, "r_x2": 408.82, "r_y2": 526.1, "r_x3": 407.38, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 410.26, "t": 526.1, "r": 450.49, "b": 528.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 528.81, "r_x1": 450.49, "r_y1": 528.81, "r_x2": 450.49, "r_y2": 526.1, "r_x3": 410.26, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 407.38, "t": 530.0, "r": 408.82, "b": 532.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 532.71, "r_x1": 408.82, "r_y1": 532.71, "r_x2": 408.82, "r_y2": 530.0, "r_x3": 407.38, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 410.26, "t": 530.0, "r": 450.49, "b": 532.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 532.71, "r_x1": 450.49, "r_y1": 532.71, "r_x2": 450.49, "r_y2": 530.0, "r_x3": 410.26, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 407.38, "t": 533.9, "r": 408.82, "b": 536.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 536.61, "r_x1": 408.82, "r_y1": 536.61, "r_x2": 408.82, "r_y2": 533.9, "r_x3": 407.38, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 410.26, "t": 533.9, "r": 450.49, "b": 536.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 536.61, "r_x1": 450.49, "r_y1": 536.61, "r_x2": 450.49, "r_y2": 533.9, "r_x3": 410.26, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 407.38, "t": 537.79, "r": 408.82, "b": 540.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 540.51, "r_x1": 408.82, "r_y1": 540.51, "r_x2": 408.82, "r_y2": 537.79, "r_x3": 407.38, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 410.26, "t": 537.79, "r": 450.49, "b": 540.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 540.51, "r_x1": 450.49, "r_y1": 540.51, "r_x2": 450.49, "r_y2": 537.79, "r_x3": 410.26, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 407.38, "t": 541.69, "r": 408.82, "b": 544.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 544.41, "r_x1": 408.82, "r_y1": 544.41, "r_x2": 408.82, "r_y2": 541.69, "r_x3": 407.38, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 410.26, "t": 541.69, "r": 450.49, "b": 544.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 544.41, "r_x1": 450.49, "r_y1": 544.41, "r_x2": 450.49, "r_y2": 541.69, "r_x3": 410.26, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 407.38, "t": 545.59, "r": 408.82, "b": 548.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 548.31, "r_x1": 408.82, "r_y1": 548.31, "r_x2": 408.82, "r_y2": 545.59, "r_x3": 407.38, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 410.26, "t": 545.59, "r": 450.49, "b": 548.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 548.31, "r_x1": 450.49, "r_y1": 548.31, "r_x2": 450.49, "r_y2": 545.59, "r_x3": 410.26, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 407.38, "t": 549.49, "r": 408.82, "b": 552.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 552.21, "r_x1": 408.82, "r_y1": 552.21, "r_x2": 408.82, "r_y2": 549.49, "r_x3": 407.38, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 410.26, "t": 549.49, "r": 450.49, "b": 552.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 552.21, "r_x1": 450.49, "r_y1": 552.21, "r_x2": 450.49, "r_y2": 549.49, "r_x3": 410.26, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 164.53, "t": 509.46, "r": 181.85, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.53, "r_y0": 515.31, "r_x1": 181.85, "r_y1": 515.31, "r_x2": 181.85, "r_y2": 509.46, "r_x3": 164.53, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.58, "t": 509.46, "r": 186.4, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58, "r_y0": 515.31, "r_x1": 186.4, "r_y1": 515.31, "r_x2": 186.4, "r_y2": 509.46, "r_x3": 183.58, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 189.21, "t": 509.46, "r": 208.9, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.21, "r_y0": 515.31, "r_x1": 208.9, "r_y1": 515.31, "r_x2": 208.9, "r_y2": 509.46, "r_x3": 189.21, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 210.63, "t": 509.46, "r": 221.04, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63, "r_y0": 515.31, "r_x1": 221.04, "r_y1": 515.31, "r_x2": 221.04, "r_y2": 509.46, "r_x3": 210.63, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 390.2, "t": 509.6, "r": 406.84, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.46, "r_x1": 406.84, "r_y1": 515.46, "r_x2": 406.84, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 408.57, "t": 509.6, "r": 411.38, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.57, "r_y0": 515.46, "r_x1": 411.38, "r_y1": 515.46, "r_x2": 411.38, "r_y2": 509.6, "r_x3": 408.57, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 414.2, "t": 509.6, "r": 433.89, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.46, "r_x1": 433.89, "r_y1": 515.46, "r_x2": 433.89, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 435.62, "t": 509.6, "r": 446.03, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.62, "r_y0": 515.46, "r_x1": 446.03, "r_y1": 515.46, "r_x2": 446.03, "r_y2": 509.6, "r_x3": 435.62, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 167.19, "t": 519.07, "r": 172.82, "b": 526.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19, "r_y0": 526.39, "r_x1": 172.82, "r_y1": 526.39, "r_x2": 172.82, "r_y2": 519.07, "r_x3": 167.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 187.34, "t": 448.62, "r": 192.97, "b": 455.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.34, "r_y0": 455.94, "r_x1": 192.97, "r_y1": 455.94, "r_x2": 192.97, "r_y2": 448.62, "r_x3": 187.34, "r_y3": 448.62, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 167.39, "t": 566.01, "r": 173.02, "b": 573.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.39, "r_y0": 573.32, "r_x1": 173.02, "r_y1": 573.32, "r_x2": 173.02, "r_y2": 566.01, "r_x3": 167.39, "r_y3": 566.01, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 248.46, "t": 621.78, "r": 253.66, "b": 629.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.46, "r_y0": 629.09, "r_x1": 253.66, "r_y1": 629.09, "r_x2": 253.66, "r_y2": 621.78, "r_x3": 248.46, "r_y3": 621.78, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 395.9, "t": 519.2, "r": 401.53, "b": 526.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.51, "r_x1": 401.53, "r_y1": 526.51, "r_x2": 401.53, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 171.63, "t": 580.29, "r": 177.48, "b": 597.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.63, "r_y0": 597.27, "r_x1": 177.48, "r_y1": 597.27, "r_x2": 177.48, "r_y2": 580.29, "r_x3": 171.63, "r_y3": 580.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 251.06, "t": 633.63, "r": 256.91, "b": 649.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.06, "r_y0": 649.92, "r_x1": 256.91, "r_y1": 649.92, "r_x2": 256.91, "r_y2": 633.63, "r_x3": 251.06, "r_y3": 633.63, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 372.15, "t": 601.46, "r": 427.04, "b": 607.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 607.31, "r_x1": 427.04, "r_y1": 607.31, "r_x2": 427.04, "r_y2": 601.46, "r_x3": 372.15, "r_y3": 601.46, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 372.15, "t": 607.9, "r": 430.07, "b": 613.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 613.75, "r_x1": 430.07, "r_y1": 613.75, "r_x2": 430.07, "r_y2": 607.9, "r_x3": 372.15, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 176.88, "t": 642.87, "r": 231.08, "b": 648.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 648.72, "r_x1": 231.08, "r_y1": 648.72, "r_x2": 231.08, "r_y2": 642.87, "r_x3": 176.88, "r_y3": 642.87, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 176.88, "t": 649.31, "r": 230.99, "b": 655.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 655.17, "r_x1": 230.99, "r_y1": 655.17, "r_x2": 230.99, "r_y2": 649.31, "r_x3": 176.88, "r_y3": 649.31, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 176.88, "t": 655.76, "r": 203.93, "b": 661.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 661.61, "r_x1": 203.93, "r_y1": 661.61, "r_x2": 203.93, "r_y2": 655.76, "r_x3": 176.88, "r_y3": 655.76, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 215.93, "t": 557.56, "r": 218.47, "b": 569.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.56, "r_x3": 215.93, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 229.06, "t": 557.56, "r": 231.72, "b": 569.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.06, "r_y0": 569.16, "r_x1": 231.72, "r_y1": 569.16, "r_x2": 231.72, "r_y2": 557.56, "r_x3": 229.06, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 261.21, "t": 448.46, "r": 263.57, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.21, "r_y0": 451.2, "r_x1": 263.57, "r_y1": 451.2, "r_x2": 263.57, "r_y2": 448.46, "r_x3": 261.21, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 312.33, "t": 448.46, "r": 313.64, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33, "r_y0": 451.2, "r_x1": 313.64, "r_y1": 451.2, "r_x2": 313.64, "r_y2": 448.46, "r_x3": 312.33, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 377.41, "t": 448.46, "r": 380.06, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41, "r_y0": 451.2, "r_x1": 380.06, "r_y1": 451.2, "r_x2": 380.06, "r_y2": 448.46, "r_x3": 377.41, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 200.64, "t": 453.34, "r": 205.82, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 456.08, "r_x1": 205.82, "r_y1": 456.08, "r_x2": 205.82, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 222.21, "t": 453.34, "r": 229.77, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.21, "r_y0": 456.08, "r_x1": 229.77, "r_y1": 456.08, "r_x2": 229.77, "r_y2": 453.34, "r_x3": 222.21, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 243.27, "t": 453.34, "r": 250.83, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.27, "r_y0": 456.08, "r_x1": 250.83, "r_y1": 456.08, "r_x2": 250.83, "r_y2": 453.34, "r_x3": 243.27, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 264.3, "t": 453.34, "r": 271.85, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.08, "r_x1": 271.85, "r_y1": 456.08, "r_x2": 271.85, "r_y2": 453.34, "r_x3": 264.3, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 285.32, "t": 453.34, "r": 292.88, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.32, "r_y0": 456.08, "r_x1": 292.88, "r_y1": 456.08, "r_x2": 292.88, "r_y2": 453.34, "r_x3": 285.32, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 306.38, "t": 453.34, "r": 311.77, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.38, "r_y0": 456.08, "r_x1": 311.77, "r_y1": 456.08, "r_x2": 311.77, "r_y2": 453.34, "r_x3": 306.38, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 323.42, "t": 453.34, "r": 325.58, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.42, "r_y0": 456.08, "r_x1": 325.58, "r_y1": 456.08, "r_x2": 325.58, "r_y2": 453.34, "r_x3": 323.42, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 334.46, "t": 453.34, "r": 336.62, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.46, "r_y0": 456.08, "r_x1": 336.62, "r_y1": 456.08, "r_x2": 336.62, "r_y2": 453.34, "r_x3": 334.46, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 345.53, "t": 453.34, "r": 347.69, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.53, "r_y0": 456.08, "r_x1": 347.69, "r_y1": 456.08, "r_x2": 347.69, "r_y2": 453.34, "r_x3": 345.53, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 356.57, "t": 453.34, "r": 358.73, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.57, "r_y0": 456.08, "r_x1": 358.73, "r_y1": 456.08, "r_x2": 358.73, "r_y2": 453.34, "r_x3": 356.57, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 367.64, "t": 453.34, "r": 371.97, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.64, "r_y0": 456.08, "r_x1": 371.97, "r_y1": 456.08, "r_x2": 371.97, "r_y2": 453.34, "r_x3": 367.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 382.67, "t": 453.34, "r": 387.01, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.67, "r_y0": 456.08, "r_x1": 387.01, "r_y1": 456.08, "r_x2": 387.01, "r_y2": 453.34, "r_x3": 382.67, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 397.74, "t": 453.34, "r": 402.07, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.74, "r_y0": 456.08, "r_x1": 402.07, "r_y1": 456.08, "r_x2": 402.07, "r_y2": 453.34, "r_x3": 397.74, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 412.79, "t": 447.99, "r": 414.93, "b": 457.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 457.8, "r_x1": 414.93, "r_y1": 457.8, "r_x2": 414.93, "r_y2": 447.99, "r_x3": 412.79, "r_y3": 447.99, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 414.96, "t": 453.34, "r": 422.52, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.96, "r_y0": 456.08, "r_x1": 422.52, "r_y1": 456.08, "r_x2": 422.52, "r_y2": 453.34, "r_x3": 414.96, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 200.64, "t": 463.92, "r": 204.58, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.58, "r_y1": 466.66, "r_x2": 204.58, "r_y2": 463.92, "r_x3": 200.64, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 367.63, "t": 463.92, "r": 369.58, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.92, "r_x3": 367.63, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 382.66, "t": 463.92, "r": 384.62, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 466.66, "r_x1": 384.62, "r_y1": 466.66, "r_x2": 384.62, "r_y2": 463.92, "r_x3": 382.66, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 397.73, "t": 463.92, "r": 399.68, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 466.66, "r_x1": 399.68, "r_y1": 466.66, "r_x2": 399.68, "r_y2": 463.92, "r_x3": 397.73, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 200.64, "t": 468.8, "r": 206.52, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.54, "r_x1": 206.52, "r_y1": 471.54, "r_x2": 206.52, "r_y2": 468.8, "r_x3": 200.64, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 264.29, "t": 468.8, "r": 266.26, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 471.54, "r_x1": 266.26, "r_y1": 471.54, "r_x2": 266.26, "r_y2": 468.8, "r_x3": 264.29, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 306.37, "t": 468.8, "r": 308.34, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37, "r_y0": 471.54, "r_x1": 308.34, "r_y1": 471.54, "r_x2": 308.34, "r_y2": 468.8, "r_x3": 306.37, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 345.52, "t": 468.8, "r": 347.48, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52, "r_y0": 471.54, "r_x1": 347.48, "r_y1": 471.54, "r_x2": 347.48, "r_y2": 468.8, "r_x3": 345.52, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 356.56, "t": 468.8, "r": 358.52, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56, "r_y0": 471.54, "r_x1": 358.52, "r_y1": 471.54, "r_x2": 358.52, "r_y2": 468.8, "r_x3": 356.56, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 367.63, "t": 468.8, "r": 369.59, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 471.54, "r_x1": 369.59, "r_y1": 471.54, "r_x2": 369.59, "r_y2": 468.8, "r_x3": 367.63, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 382.66, "t": 468.8, "r": 384.63, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 471.54, "r_x1": 384.63, "r_y1": 471.54, "r_x2": 384.63, "r_y2": 468.8, "r_x3": 382.66, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 200.64, "t": 473.68, "r": 206.52, "b": 476.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.42, "r_x1": 206.52, "r_y1": 476.42, "r_x2": 206.52, "r_y2": 473.68, "r_x3": 200.64, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 264.29, "t": 473.68, "r": 266.26, "b": 476.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 476.42, "r_x1": 266.26, "r_y1": 476.42, "r_x2": 266.26, "r_y2": 473.68, "r_x3": 264.29, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 200.64, "t": 478.53, "r": 206.52, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.27, "r_x1": 206.52, "r_y1": 481.27, "r_x2": 206.52, "r_y2": 478.53, "r_x3": 200.64, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 243.26, "t": 478.53, "r": 245.23, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26, "r_y0": 481.27, "r_x1": 245.23, "r_y1": 481.27, "r_x2": 245.23, "r_y2": 478.53, "r_x3": 243.26, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 264.29, "t": 478.53, "r": 266.26, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 481.27, "r_x1": 266.26, "r_y1": 481.27, "r_x2": 266.26, "r_y2": 478.53, "r_x3": 264.29, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 323.4, "t": 478.53, "r": 325.37, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.27, "r_x1": 325.37, "r_y1": 481.27, "r_x2": 325.37, "r_y2": 478.53, "r_x3": 323.4, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 397.73, "t": 478.53, "r": 399.69, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 481.27, "r_x1": 399.69, "r_y1": 481.27, "r_x2": 399.69, "r_y2": 478.53, "r_x3": 397.73, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 200.64, "t": 483.41, "r": 206.52, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.15, "r_x1": 206.52, "r_y1": 486.15, "r_x2": 206.52, "r_y2": 483.41, "r_x3": 200.64, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 382.66, "t": 483.41, "r": 384.62, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 486.15, "r_x1": 384.62, "r_y1": 486.15, "r_x2": 384.62, "r_y2": 483.41, "r_x3": 382.66, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 397.73, "t": 483.41, "r": 401.65, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 486.15, "r_x1": 401.65, "r_y1": 486.15, "r_x2": 401.65, "r_y2": 483.41, "r_x3": 397.73, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 412.79, "t": 483.41, "r": 414.74, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 486.15, "r_x1": 414.74, "r_y1": 486.15, "r_x2": 414.74, "r_y2": 483.41, "r_x3": 412.79, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 200.64, "t": 488.29, "r": 207.14, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 491.03, "r_x1": 207.14, "r_y1": 491.03, "r_x2": 207.14, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 367.63, "t": 488.29, "r": 369.78, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 491.03, "r_x1": 369.78, "r_y1": 491.03, "r_x2": 369.78, "r_y2": 488.29, "r_x3": 367.63, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 382.66, "t": 488.29, "r": 384.82, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 491.03, "r_x1": 384.82, "r_y1": 491.03, "r_x2": 384.82, "r_y2": 488.29, "r_x3": 382.66, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 397.73, "t": 488.29, "r": 402.05, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 491.03, "r_x1": 402.05, "r_y1": 491.03, "r_x2": 402.05, "r_y2": 488.29, "r_x3": 397.73, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 200.64, "t": 493.17, "r": 208.49, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 495.9, "r_x1": 208.49, "r_y1": 495.9, "r_x2": 208.49, "r_y2": 493.17, "r_x3": 200.64, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 264.29, "t": 493.17, "r": 266.26, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 495.9, "r_x1": 266.26, "r_y1": 495.9, "r_x2": 266.26, "r_y2": 493.17, "r_x3": 264.29, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 155, "page_no": 9, "cluster": { "id": 155, "label": "text", "bbox": { "l": 227.91, "t": 665.83, "r": 230.1, "b": 675.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.91, "r_y0": 675.35, "r_x1": 230.1, "r_y1": 675.35, "r_x2": 230.1, "r_y2": 665.83, "r_x3": 227.91, "r_y3": 665.83, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u03bc" }, { "label": "text", "id": 156, "page_no": 9, "cluster": { "id": 156, "label": "text", "bbox": { "l": 300.58, "t": 683.62, "r": 302.73, "b": 693.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.58, "r_y0": 693.43, "r_x1": 302.73, "r_y1": 693.43, "r_x2": 302.73, "r_y2": 683.62, "r_x3": 300.58, "r_y3": 683.62, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u2265" } ], "body": [ { "label": "caption", "id": 4, "page_no": 9, "cluster": { "id": 4, "label": "caption", "bbox": { "l": 134.76, "t": 115.84, "r": 480.59, "b": 145.89, "coord_origin": "TOPLEFT" }, "confidence": 0.951, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 123.76, "r_x1": 173.09, "r_y1": 123.76, "r_x2": 173.09, "r_y2": 115.84, "r_x3": 134.76, "r_y3": 115.84, "coord_origin": "TOPLEFT" }, "text": "Table 2.", "orig": "Table 2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.3, "r_y0": 123.97, "r_x1": 480.59, "r_y1": 123.97, "r_x2": 480.59, "r_y2": 115.9, "r_x3": 181.3, "r_y3": 115.9, "coord_origin": "TOPLEFT" }, "text": "TSR and cell detection results compared between OTSL and HTML on", "orig": "TSR and cell detection results compared between OTSL and HTML on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 134.93, "r_x1": 480.59, "r_y1": 134.93, "r_x2": 480.59, "r_y2": 126.86, "r_x3": 134.76, "r_y3": 126.86, "coord_origin": "TOPLEFT" }, "text": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "orig": "the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 145.89, "r_x1": 305.96, "r_y1": 145.89, "r_x2": 305.96, "r_y2": 137.82, "r_x3": 134.76, "r_y3": 137.82, "coord_origin": "TOPLEFT" }, "text": "Former [9] (with enc=6, dec=6, heads=8).", "orig": "Former [9] (with enc=6, dec=6, heads=8).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Table 2. TSR and cell detection results compared between OTSL and HTML on the PubTabNet [22], FinTabNet [21] and PubTables-1M [14] data sets using TableFormer [9] (with enc=6, dec=6, heads=8)." }, { "label": "table", "id": 0, "page_no": 9, "cluster": { "id": 0, "label": "table", "bbox": { "l": 143.64, "t": 156.35, "r": 470.85, "b": 263.26, "coord_origin": "TOPLEFT" }, "confidence": 0.988, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.78, "r_y0": 174.63, "r_x1": 195.0, "r_y1": 174.63, "r_x2": 195.0, "r_y2": 166.56, "r_x3": 160.78, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52, "r_y0": 174.6, "r_x1": 254.04, "r_y1": 174.6, "r_x2": 254.04, "r_y2": 166.53, "r_x3": 215.52, "r_y3": 166.53, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.15, "r_x1": 323.99, "r_y1": 169.15, "r_x2": 323.99, "r_y2": 161.08, "r_x3": 300.4, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.35, "r_y0": 174.63, "r_x1": 414.75, "r_y1": 174.63, "r_x2": 414.75, "r_y2": 166.56, "r_x3": 370.35, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.74, "r_y0": 169.15, "r_x1": 463.11, "r_y1": 169.15, "r_x2": 463.11, "r_y2": 161.08, "r_x3": 426.74, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11, "r_y0": 180.11, "r_x1": 466.73, "r_y1": 180.11, "r_x2": 466.73, "r_y2": 172.04, "r_x3": 423.11, "r_y3": 172.04, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41, "r_y0": 182.1, "r_x1": 288.06, "r_y1": 182.1, "r_x2": 288.06, "r_y2": 174.03, "r_x3": 262.41, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.43, "r_y0": 182.1, "r_x1": 329.45, "r_y1": 182.1, "r_x2": 329.45, "r_y2": 174.03, "r_x3": 296.43, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03, "r_y0": 182.1, "r_x1": 354.76, "r_y1": 182.1, "r_x2": 354.76, "r_y2": 174.03, "r_x3": 345.03, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.54, "r_y0": 200.93, "r_x1": 201.24, "r_y1": 200.93, "r_x2": 201.24, "r_y2": 192.86, "r_x3": 154.54, "r_y3": 192.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 195.45, "r_x1": 247.13, "r_y1": 195.45, "r_x2": 247.13, "r_y2": 187.38, "r_x3": 222.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 195.45, "r_x1": 285.73, "r_y1": 195.45, "r_x2": 285.73, "r_y2": 187.38, "r_x3": 264.74, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 195.45, "r_x1": 323.43, "r_y1": 195.45, "r_x2": 323.43, "r_y2": 187.38, "r_x3": 302.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.45, "r_x1": 360.39, "r_y1": 195.45, "r_x2": 360.39, "r_y2": 187.38, "r_x3": 339.4, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.12, "r_y0": 195.24, "r_x1": 401.97, "r_y1": 195.24, "r_x2": 401.97, "r_y2": 187.32, "r_x3": 383.12, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 195.24, "r_x1": 454.35, "r_y1": 195.24, "r_x2": 454.35, "r_y2": 187.32, "r_x3": 435.49, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.67, "r_y1": 208.4, "r_x2": 248.67, "r_y2": 200.33, "r_x3": 220.9, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 208.4, "r_x1": 285.73, "r_y1": 208.4, "r_x2": 285.73, "r_y2": 200.33, "r_x3": 264.74, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 208.4, "r_x1": 323.43, "r_y1": 208.4, "r_x2": 323.43, "r_y2": 200.33, "r_x3": 302.44, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.39, "r_y1": 208.4, "r_x2": 360.39, "r_y2": 200.33, "r_x3": 339.4, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 208.4, "r_x1": 403.04, "r_y1": 208.4, "r_x2": 403.04, "r_y2": 200.33, "r_x3": 382.05, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 208.4, "r_x1": 453.11, "r_y1": 208.4, "r_x2": 453.11, "r_y2": 200.33, "r_x3": 436.73, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.95, "r_y0": 227.23, "r_x1": 199.83, "r_y1": 227.23, "r_x2": 199.83, "r_y2": 219.16, "r_x3": 155.95, "r_y3": 219.16, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 221.75, "r_x1": 247.13, "r_y1": 221.75, "r_x2": 247.13, "r_y2": 213.68, "r_x3": 222.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 221.75, "r_x1": 285.73, "r_y1": 221.75, "r_x2": 285.73, "r_y2": 213.68, "r_x3": 264.74, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 221.75, "r_x1": 323.43, "r_y1": 221.75, "r_x2": 323.43, "r_y2": 213.68, "r_x3": 302.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 221.55, "r_x1": 361.98, "r_y1": 221.55, "r_x2": 361.98, "r_y2": 213.62, "r_x3": 337.81, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 221.55, "r_x1": 404.62, "r_y1": 221.55, "r_x2": 404.62, "r_y2": 213.62, "r_x3": 380.46, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 221.55, "r_x1": 454.35, "r_y1": 221.55, "r_x2": 454.35, "r_y2": 213.62, "r_x3": 435.49, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.67, "r_y1": 234.7, "r_x2": 248.67, "r_y2": 226.63, "r_x3": 220.9, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 234.7, "r_x1": 285.73, "r_y1": 234.7, "r_x2": 285.73, "r_y2": 226.63, "r_x3": 264.74, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 234.7, "r_x1": 323.43, "r_y1": 234.7, "r_x2": 323.43, "r_y2": 226.63, "r_x3": 302.44, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.71, "r_y0": 234.7, "r_x1": 358.09, "r_y1": 234.7, "r_x2": 358.09, "r_y2": 226.63, "r_x3": 341.71, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 234.7, "r_x1": 403.04, "r_y1": 234.7, "r_x2": 403.04, "r_y2": 226.63, "r_x3": 382.05, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 234.7, "r_x1": 453.11, "r_y1": 234.7, "r_x2": 453.11, "r_y2": 226.63, "r_x3": 436.73, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.63, "r_y0": 253.53, "r_x1": 207.15, "r_y1": 253.53, "r_x2": 207.15, "r_y2": 245.46, "r_x3": 148.63, "r_y3": 245.46, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 248.05, "r_x1": 247.13, "r_y1": 248.05, "r_x2": 247.13, "r_y2": 239.98, "r_x3": 222.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 248.05, "r_x1": 285.73, "r_y1": 248.05, "r_x2": 285.73, "r_y2": 239.98, "r_x3": 264.74, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 248.05, "r_x1": 323.43, "r_y1": 248.05, "r_x2": 323.43, "r_y2": 239.98, "r_x3": 302.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 247.85, "r_x1": 361.98, "r_y1": 247.85, "r_x2": 361.98, "r_y2": 239.92, "r_x3": 337.81, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 247.85, "r_x1": 404.62, "r_y1": 247.85, "r_x2": 404.62, "r_y2": 239.92, "r_x3": 380.46, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 247.85, "r_x1": 454.35, "r_y1": 247.85, "r_x2": 454.35, "r_y2": 239.92, "r_x3": 435.49, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.67, "r_y1": 261.0, "r_x2": 248.67, "r_y2": 252.93, "r_x3": 220.9, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 261.0, "r_x1": 285.73, "r_y1": 261.0, "r_x2": 285.73, "r_y2": 252.93, "r_x3": 264.74, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 261.0, "r_x1": 323.43, "r_y1": 261.0, "r_x2": 323.43, "r_y2": 252.93, "r_x3": 302.44, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.39, "r_y1": 261.0, "r_x2": 360.39, "r_y2": 252.93, "r_x3": 339.4, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 261.0, "r_x1": 403.04, "r_y1": 261.0, "r_x2": 403.04, "r_y2": 252.93, "r_x3": 382.05, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 261.0, "r_x1": 453.11, "r_y1": 261.0, "r_x2": 453.11, "r_y2": 252.93, "r_x3": 436.73, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 10, "label": "text", "bbox": { "l": 160.78, "t": 166.56, "r": 195.0, "b": 174.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.78, "r_y0": 174.63, "r_x1": 195.0, "r_y1": 174.63, "r_x2": 195.0, "r_y2": 166.56, "r_x3": 160.78, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "Data set", "orig": "Data set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "text", "bbox": { "l": 215.52, "t": 166.53, "r": 254.04, "b": 174.6, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.52, "r_y0": 174.6, "r_x1": 254.04, "r_y1": 174.6, "r_x2": 254.04, "r_y2": 166.53, "r_x3": 215.52, "r_y3": 166.53, "coord_origin": "TOPLEFT" }, "text": "Language", "orig": "Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "text", "bbox": { "l": 300.4, "t": 161.08, "r": 323.99, "b": 169.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.4, "r_y0": 169.15, "r_x1": 323.99, "r_y1": 169.15, "r_x2": 323.99, "r_y2": 161.08, "r_x3": 300.4, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "TEDs", "orig": "TEDs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 13, "label": "text", "bbox": { "l": 370.35, "t": 166.56, "r": 414.75, "b": 174.63, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 370.35, "r_y0": 174.63, "r_x1": 414.75, "r_y1": 174.63, "r_x2": 414.75, "r_y2": 166.56, "r_x3": 370.35, "r_y3": 166.56, "coord_origin": "TOPLEFT" }, "text": "mAP(0.75)", "orig": "mAP(0.75)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "text", "bbox": { "l": 426.74, "t": 161.08, "r": 463.11, "b": 169.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 426.74, "r_y0": 169.15, "r_x1": 463.11, "r_y1": 169.15, "r_x2": 463.11, "r_y2": 161.08, "r_x3": 426.74, "r_y3": 161.08, "coord_origin": "TOPLEFT" }, "text": "Inference", "orig": "Inference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 15, "label": "text", "bbox": { "l": 423.11, "t": 172.04, "r": 466.73, "b": 180.11, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 423.11, "r_y0": 180.11, "r_x1": 466.73, "r_y1": 180.11, "r_x2": 466.73, "r_y2": 172.04, "r_x3": 423.11, "r_y3": 172.04, "coord_origin": "TOPLEFT" }, "text": "time (secs)", "orig": "time (secs)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 16, "label": "text", "bbox": { "l": 262.41, "t": 174.03, "r": 288.06, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 262.41, "r_y0": 182.1, "r_x1": 288.06, "r_y1": 182.1, "r_x2": 288.06, "r_y2": 174.03, "r_x3": 262.41, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "simple", "orig": "simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 17, "label": "text", "bbox": { "l": 296.43, "t": 174.03, "r": 329.45, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 296.43, "r_y0": 182.1, "r_x1": 329.45, "r_y1": 182.1, "r_x2": 329.45, "r_y2": 174.03, "r_x3": 296.43, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "complex", "orig": "complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 18, "label": "text", "bbox": { "l": 345.03, "t": 174.03, "r": 354.76, "b": 182.1, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.03, "r_y0": 182.1, "r_x1": 354.76, "r_y1": 182.1, "r_x2": 354.76, "r_y2": 174.03, "r_x3": 345.03, "r_y3": 174.03, "coord_origin": "TOPLEFT" }, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 154.54, "t": 192.86, "r": 201.24, "b": 200.93, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.54, "r_y0": 200.93, "r_x1": 201.24, "r_y1": 200.93, "r_x2": 201.24, "r_y2": 192.86, "r_x3": 154.54, "r_y3": 192.86, "coord_origin": "TOPLEFT" }, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 222.44, "t": 187.38, "r": 247.13, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 195.45, "r_x1": 247.13, "r_y1": 195.45, "r_x2": 247.13, "r_y2": 187.38, "r_x3": 222.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 264.74, "t": 187.38, "r": 285.73, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 195.45, "r_x1": 285.73, "r_y1": 195.45, "r_x2": 285.73, "r_y2": 187.38, "r_x3": 264.74, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.965", "orig": "0.965", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 302.44, "t": 187.38, "r": 323.43, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 195.45, "r_x1": 323.43, "r_y1": 195.45, "r_x2": 323.43, "r_y2": 187.38, "r_x3": 302.44, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.934", "orig": "0.934", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 339.4, "t": 187.38, "r": 360.39, "b": 195.45, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 195.45, "r_x1": 360.39, "r_y1": 195.45, "r_x2": 360.39, "r_y2": 187.38, "r_x3": 339.4, "r_y3": 187.38, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 383.12, "t": 187.32, "r": 401.97, "b": 195.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 383.12, "r_y0": 195.24, "r_x1": 401.97, "r_y1": 195.24, "r_x2": 401.97, "r_y2": 187.32, "r_x3": 383.12, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "0.88", "orig": "0.88", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 435.49, "t": 187.32, "r": 454.35, "b": 195.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 195.24, "r_x1": 454.35, "r_y1": 195.24, "r_x2": 454.35, "r_y2": 187.32, "r_x3": 435.49, "r_y3": 187.32, "coord_origin": "TOPLEFT" }, "text": "2.73", "orig": "2.73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 220.9, "t": 200.33, "r": 248.67, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 208.4, "r_x1": 248.67, "r_y1": 208.4, "r_x2": 248.67, "r_y2": 200.33, "r_x3": 220.9, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 264.74, "t": 200.33, "r": 285.73, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 208.4, "r_x1": 285.73, "r_y1": 208.4, "r_x2": 285.73, "r_y2": 200.33, "r_x3": 264.74, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.969", "orig": "0.969", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 302.44, "t": 200.33, "r": 323.43, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 208.4, "r_x1": 323.43, "r_y1": 208.4, "r_x2": 323.43, "r_y2": 200.33, "r_x3": 302.44, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.927", "orig": "0.927", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 29, "label": "text", "bbox": { "l": 339.4, "t": 200.33, "r": 360.39, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 208.4, "r_x1": 360.39, "r_y1": 208.4, "r_x2": 360.39, "r_y2": 200.33, "r_x3": 339.4, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 30, "label": "text", "bbox": { "l": 382.05, "t": 200.33, "r": 403.04, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 208.4, "r_x1": 403.04, "r_y1": 208.4, "r_x2": 403.04, "r_y2": 200.33, "r_x3": 382.05, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "0.857", "orig": "0.857", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 31, "label": "text", "bbox": { "l": 436.73, "t": 200.33, "r": 453.11, "b": 208.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 208.4, "r_x1": 453.11, "r_y1": 208.4, "r_x2": 453.11, "r_y2": 200.33, "r_x3": 436.73, "r_y3": 200.33, "coord_origin": "TOPLEFT" }, "text": "5.39", "orig": "5.39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 32, "label": "text", "bbox": { "l": 155.95, "t": 219.16, "r": 199.83, "b": 227.23, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 155.95, "r_y0": 227.23, "r_x1": 199.83, "r_y1": 227.23, "r_x2": 199.83, "r_y2": 219.16, "r_x3": 155.95, "r_y3": 219.16, "coord_origin": "TOPLEFT" }, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 33, "label": "text", "bbox": { "l": 222.44, "t": 213.68, "r": 247.13, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 221.75, "r_x1": 247.13, "r_y1": 221.75, "r_x2": 247.13, "r_y2": 213.68, "r_x3": 222.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 34, "label": "text", "bbox": { "l": 264.74, "t": 213.68, "r": 285.73, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 221.75, "r_x1": 285.73, "r_y1": 221.75, "r_x2": 285.73, "r_y2": 213.68, "r_x3": 264.74, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.955", "orig": "0.955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 35, "label": "text", "bbox": { "l": 302.44, "t": 213.68, "r": 323.43, "b": 221.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 221.75, "r_x1": 323.43, "r_y1": 221.75, "r_x2": 323.43, "r_y2": 213.68, "r_x3": 302.44, "r_y3": 213.68, "coord_origin": "TOPLEFT" }, "text": "0.961", "orig": "0.961", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 36, "label": "text", "bbox": { "l": 337.81, "t": 213.62, "r": 361.98, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 221.55, "r_x1": 361.98, "r_y1": 221.55, "r_x2": 361.98, "r_y2": 213.62, "r_x3": 337.81, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.959", "orig": "0.959", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 37, "label": "text", "bbox": { "l": 380.46, "t": 213.62, "r": 404.62, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 221.55, "r_x1": 404.62, "r_y1": 221.55, "r_x2": 404.62, "r_y2": 213.62, "r_x3": 380.46, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "0.862", "orig": "0.862", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 38, "label": "text", "bbox": { "l": 435.49, "t": 213.62, "r": 454.35, "b": 221.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 221.55, "r_x1": 454.35, "r_y1": 221.55, "r_x2": 454.35, "r_y2": 213.62, "r_x3": 435.49, "r_y3": 213.62, "coord_origin": "TOPLEFT" }, "text": "1.85", "orig": "1.85", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 39, "label": "text", "bbox": { "l": 220.9, "t": 226.63, "r": 248.67, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 234.7, "r_x1": 248.67, "r_y1": 234.7, "r_x2": 248.67, "r_y2": 226.63, "r_x3": 220.9, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 40, "label": "text", "bbox": { "l": 264.74, "t": 226.63, "r": 285.73, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 234.7, "r_x1": 285.73, "r_y1": 234.7, "r_x2": 285.73, "r_y2": 226.63, "r_x3": 264.74, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.917", "orig": "0.917", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 41, "label": "text", "bbox": { "l": 302.44, "t": 226.63, "r": 323.43, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 234.7, "r_x1": 323.43, "r_y1": 234.7, "r_x2": 323.43, "r_y2": 226.63, "r_x3": 302.44, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.922", "orig": "0.922", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 42, "label": "text", "bbox": { "l": 341.71, "t": 226.63, "r": 358.09, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 341.71, "r_y0": 234.7, "r_x1": 358.09, "r_y1": 234.7, "r_x2": 358.09, "r_y2": 226.63, "r_x3": 341.71, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.92", "orig": "0.92", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 43, "label": "text", "bbox": { "l": 382.05, "t": 226.63, "r": 403.04, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 234.7, "r_x1": 403.04, "r_y1": 234.7, "r_x2": 403.04, "r_y2": 226.63, "r_x3": 382.05, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "0.722", "orig": "0.722", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 44, "label": "text", "bbox": { "l": 436.73, "t": 226.63, "r": 453.11, "b": 234.7, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 234.7, "r_x1": 453.11, "r_y1": 234.7, "r_x2": 453.11, "r_y2": 226.63, "r_x3": 436.73, "r_y3": 226.63, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 45, "label": "text", "bbox": { "l": 148.63, "t": 245.46, "r": 207.15, "b": 253.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 148.63, "r_y0": 253.53, "r_x1": 207.15, "r_y1": 253.53, "r_x2": 207.15, "r_y2": 245.46, "r_x3": 148.63, "r_y3": 245.46, "coord_origin": "TOPLEFT" }, "text": "PubTables-1M", "orig": "PubTables-1M", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 46, "label": "text", "bbox": { "l": 222.44, "t": 239.98, "r": 247.13, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.44, "r_y0": 248.05, "r_x1": 247.13, "r_y1": 248.05, "r_x2": 247.13, "r_y2": 239.98, "r_x3": 222.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 47, "label": "text", "bbox": { "l": 264.74, "t": 239.98, "r": 285.73, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 248.05, "r_x1": 285.73, "r_y1": 248.05, "r_x2": 285.73, "r_y2": 239.98, "r_x3": 264.74, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.987", "orig": "0.987", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 48, "label": "text", "bbox": { "l": 302.44, "t": 239.98, "r": 323.43, "b": 248.05, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 248.05, "r_x1": 323.43, "r_y1": 248.05, "r_x2": 323.43, "r_y2": 239.98, "r_x3": 302.44, "r_y3": 239.98, "coord_origin": "TOPLEFT" }, "text": "0.964", "orig": "0.964", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 49, "label": "text", "bbox": { "l": 337.81, "t": 239.92, "r": 361.98, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.81, "r_y0": 247.85, "r_x1": 361.98, "r_y1": 247.85, "r_x2": 361.98, "r_y2": 239.92, "r_x3": 337.81, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.977", "orig": "0.977", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 50, "label": "text", "bbox": { "l": 380.46, "t": 239.92, "r": 404.62, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 380.46, "r_y0": 247.85, "r_x1": 404.62, "r_y1": 247.85, "r_x2": 404.62, "r_y2": 239.92, "r_x3": 380.46, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "0.896", "orig": "0.896", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 51, "label": "text", "bbox": { "l": 435.49, "t": 239.92, "r": 454.35, "b": 247.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.49, "r_y0": 247.85, "r_x1": 454.35, "r_y1": 247.85, "r_x2": 454.35, "r_y2": 239.92, "r_x3": 435.49, "r_y3": 239.92, "coord_origin": "TOPLEFT" }, "text": "1.79", "orig": "1.79", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 52, "label": "text", "bbox": { "l": 220.9, "t": 252.93, "r": 248.67, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 220.9, "r_y0": 261.0, "r_x1": 248.67, "r_y1": 261.0, "r_x2": 248.67, "r_y2": 252.93, "r_x3": 220.9, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 53, "label": "text", "bbox": { "l": 264.74, "t": 252.93, "r": 285.73, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.74, "r_y0": 261.0, "r_x1": 285.73, "r_y1": 261.0, "r_x2": 285.73, "r_y2": 252.93, "r_x3": 264.74, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.983", "orig": "0.983", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 54, "label": "text", "bbox": { "l": 302.44, "t": 252.93, "r": 323.43, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 302.44, "r_y0": 261.0, "r_x1": 323.43, "r_y1": 261.0, "r_x2": 323.43, "r_y2": 252.93, "r_x3": 302.44, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.944", "orig": "0.944", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 55, "label": "text", "bbox": { "l": 339.4, "t": 252.93, "r": 360.39, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 339.4, "r_y0": 261.0, "r_x1": 360.39, "r_y1": 261.0, "r_x2": 360.39, "r_y2": 252.93, "r_x3": 339.4, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.966", "orig": "0.966", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 56, "label": "text", "bbox": { "l": 382.05, "t": 252.93, "r": 403.04, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.05, "r_y0": 261.0, "r_x1": 403.04, "r_y1": 261.0, "r_x2": 403.04, "r_y2": 252.93, "r_x3": 382.05, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "0.889", "orig": "0.889", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 57, "label": "text", "bbox": { "l": 436.73, "t": 252.93, "r": 453.11, "b": 261.0, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 436.73, "r_y0": 261.0, "r_x1": 453.11, "r_y1": 261.0, "r_x2": 453.11, "r_y2": 252.93, "r_x3": 436.73, "r_y3": 252.93, "coord_origin": "TOPLEFT" }, "text": "3.26", "orig": "3.26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": null, "otsl_seq": [ "ched", "ched", "ched", "lcel", "lcel", "ched", "ched", "nl", "ucel", "ucel", "ched", "ched", "ched", "ucel", "ucel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl" ], "num_rows": 5, "num_cols": 7, "table_cells": [ { "bbox": { "l": 160.78, "t": 166.56, "r": 195.0, "b": 174.63, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Data set", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 215.52, "t": 166.53, "r": 254.04, "b": 174.6, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Language", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 300.4, "t": 161.08, "r": 323.99, "b": 169.15, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 3, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 5, "text": "TEDs", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 370.35, "t": 166.56, "r": 414.75, "b": 174.63, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "mAP(0.75)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 426.74, "t": 161.08, "r": 463.11, "b": 169.15, "coord_origin": "TOPLEFT" }, "row_span": 2, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 2, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "Inference time (secs)", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 262.41, "t": 174.03, "r": 288.06, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "simple", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 296.43, "t": 174.03, "r": 329.45, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "complex", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 345.03, "t": 174.03, "r": 354.76, "b": 182.1, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "all", "column_header": true, "row_header": false, "row_section": false }, { "bbox": { "l": 154.54, "t": 192.86, "r": 201.24, "b": 200.93, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.44, "t": 187.38, "r": 247.13, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74, "t": 187.38, "r": 285.73, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.965 0.969", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.44, "t": 187.38, "r": 323.43, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.934 0.927", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 339.4, "t": 187.38, "r": 360.39, "b": 195.45, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.955 0.955", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 383.12, "t": 187.32, "r": 401.97, "b": 195.24, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.88 0.857", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49, "t": 187.32, "r": 454.35, "b": 195.24, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "2.73 5.39", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 155.95, "t": 219.16, "r": 199.83, "b": 227.23, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.44, "t": 213.68, "r": 247.13, "b": 221.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74, "t": 213.68, "r": 285.73, "b": 221.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.955 0.917", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.44, "t": 213.68, "r": 323.43, "b": 221.75, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.961 0.922", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.81, "t": 213.62, "r": 361.98, "b": 221.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.959 0.92", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46, "t": 213.62, "r": 404.62, "b": 221.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.862 0.722", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49, "t": 213.62, "r": 454.35, "b": 221.55, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.85 3.26", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 148.63, "t": 245.46, "r": 207.15, "b": 253.53, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTables-1M", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 222.44, "t": 239.98, "r": 247.13, "b": 248.05, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "OTSL HTML", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 264.74, "t": 239.98, "r": 285.73, "b": 248.05, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.987 0.983", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 302.44, "t": 239.98, "r": 323.43, "b": 248.05, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0.964 0.944", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 337.81, "t": 239.92, "r": 361.98, "b": 247.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "0.977 0.966", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 380.46, "t": 239.92, "r": 404.62, "b": 247.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0.896 0.889", "column_header": false, "row_header": false, "row_section": false }, { "bbox": { "l": 435.49, "t": 239.92, "r": 454.35, "b": 247.85, "coord_origin": "TOPLEFT" }, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 6, "end_col_offset_idx": 7, "text": "1.79 3.26", "column_header": false, "row_header": false, "row_section": false } ] }, { "label": "section_header", "id": 3, "page_no": 9, "cluster": { "id": 3, "label": "section_header", "bbox": { "l": 134.76, "t": 288.91, "r": 257.09, "b": 297.72, "coord_origin": "TOPLEFT" }, "confidence": 0.955, "cells": [ { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 297.72, "r_x1": 149.4, "r_y1": 297.72, "r_x2": 149.4, "r_y2": 288.91, "r_x3": 134.76, "r_y3": 288.91, "coord_origin": "TOPLEFT" }, "text": "5.3", "orig": "5.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 160.86, "r_y0": 297.72, "r_x1": 257.09, "r_y1": 297.72, "r_x2": 257.09, "r_y2": 288.91, "r_x3": 160.86, "r_y3": 288.91, "coord_origin": "TOPLEFT" }, "text": "Qualitative Results", "orig": "Qualitative Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5.3 Qualitative Results" }, { "label": "text", "id": 1, "page_no": 9, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 309.86, "r": 480.59, "b": 366.48, "coord_origin": "TOPLEFT" }, "confidence": 0.983, "cells": [ { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 318.66, "r_x1": 480.59, "r_y1": 318.66, "r_x2": 480.59, "r_y2": 309.86, "r_x3": 134.76, "r_y3": 309.86, "coord_origin": "TOPLEFT" }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "orig": "To illustrate the qualitative differences between OTSL and HTML, Figure 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 330.61, "r_x1": 480.59, "r_y1": 330.61, "r_x2": 480.59, "r_y2": 321.82, "r_x3": 134.76, "r_y3": 321.82, "coord_origin": "TOPLEFT" }, "text": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "orig": "demonstrates less overlap and more accurate bounding boxes with OTSL. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 342.57, "r_x1": 480.59, "r_y1": 342.57, "r_x2": 480.59, "r_y2": 333.77, "r_x3": 134.76, "r_y3": 333.77, "coord_origin": "TOPLEFT" }, "text": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "orig": "Figure 6, OTSL proves to be more effective in handling tables with longer to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 354.52, "r_x1": 480.59, "r_y1": 354.52, "r_x2": 480.59, "r_y2": 345.73, "r_x3": 134.76, "r_y3": 345.73, "coord_origin": "TOPLEFT" }, "text": "ken sequences, resulting in even more precise structure prediction and bounding", "orig": "ken sequences, resulting in even more precise structure prediction and bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 366.48, "r_x1": 161.66, "r_y1": 366.48, "r_x2": 161.66, "r_y2": 357.68, "r_x3": 134.76, "r_y3": 357.68, "coord_origin": "TOPLEFT" }, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "To illustrate the qualitative differences between OTSL and HTML, Figure 5 demonstrates less overlap and more accurate bounding boxes with OTSL. In Figure 6, OTSL proves to be more effective in handling tables with longer token sequences, resulting in even more precise structure prediction and bounding boxes." }, { "label": "caption", "id": 5, "page_no": 9, "cluster": { "id": 5, "label": "caption", "bbox": { "l": 134.76, "t": 397.59, "r": 480.59, "b": 439.72, "coord_origin": "TOPLEFT" }, "confidence": 0.948, "cells": [ { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 405.52, "r_x1": 162.64, "r_y1": 405.52, "r_x2": 162.64, "r_y2": 397.59, "r_x3": 134.76, "r_y3": 397.59, "coord_origin": "TOPLEFT" }, "text": "Fig. 5.", "orig": "Fig. 5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.38, "r_y0": 405.72, "r_x1": 480.59, "r_y1": 405.72, "r_x2": 480.59, "r_y2": 397.65, "r_x3": 167.38, "r_y3": 397.65, "coord_origin": "TOPLEFT" }, "text": "The OTSL model produces more accurate bounding boxes with less over-", "orig": "The OTSL model produces more accurate bounding boxes with less over-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 416.68, "r_x1": 480.59, "r_y1": 416.68, "r_x2": 480.59, "r_y2": 408.61, "r_x3": 134.76, "r_y3": 408.61, "coord_origin": "TOPLEFT" }, "text": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "orig": "lap (E) than the HTML model (D), when predicting the structure of a sparse ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 427.64, "r_x1": 480.59, "r_y1": 427.64, "r_x2": 480.59, "r_y2": 419.57, "r_x3": 134.76, "r_y3": 419.57, "coord_origin": "TOPLEFT" }, "text": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "orig": "ble (A), at twice the inference speed because of shorter sequence length (B),(C).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 438.6, "r_x1": 304.69, "r_y1": 438.6, "r_x2": 304.69, "r_y2": 430.53, "r_x3": 134.76, "r_y3": 430.53, "coord_origin": "TOPLEFT" }, "text": "\"PMC2807444_006_00.png\" PubTabNet.", "orig": "\"PMC2807444_006_00.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 118, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 342.63, "r_y0": 439.72, "r_x1": 344.82, "r_y1": 439.72, "r_x2": 344.82, "r_y2": 430.2, "r_x3": 342.63, "r_y3": 430.2, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 5. The OTSL model produces more accurate bounding boxes with less overlap (E) than the HTML model (D), when predicting the structure of a sparse table (A), at twice the inference speed because of shorter sequence length (B),(C). \"PMC2807444_006_00.png\" PubTabNet. \u03bc" }, { "label": "picture", "id": 2, "page_no": 9, "cluster": { "id": 2, "label": "picture", "bbox": { "l": 162.67, "t": 444.62, "r": 451.7, "b": 663.21, "coord_origin": "TOPLEFT" }, "confidence": 0.974, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 518.95, "r_x1": 190.62, "r_y1": 518.95, "r_x2": 190.62, "r_y2": 516.23, "r_x3": 180.12, "r_y3": 516.23, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 522.85, "r_x1": 304.55, "r_y1": 522.85, "r_x2": 304.55, "r_y2": 520.13, "r_x3": 183.24, "r_y3": 520.13, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 526.75, "r_x1": 388.42, "r_y1": 526.75, "r_x2": 388.42, "r_y2": 524.03, "r_x3": 183.24, "r_y3": 524.03, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 530.65, "r_x1": 388.42, "r_y1": 530.65, "r_x2": 388.42, "r_y2": 527.93, "r_x3": 183.24, "r_y3": 527.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 534.55, "r_x1": 388.42, "r_y1": 534.55, "r_x2": 388.42, "r_y2": 531.83, "r_x3": 183.24, "r_y3": 531.83, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 538.44, "r_x1": 388.42, "r_y1": 538.44, "r_x2": 388.42, "r_y2": 535.73, "r_x3": 183.24, "r_y3": 535.73, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 542.34, "r_x1": 388.42, "r_y1": 542.34, "r_x2": 388.42, "r_y2": 539.63, "r_x3": 183.24, "r_y3": 539.63, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 546.24, "r_x1": 388.42, "r_y1": 546.24, "r_x2": 388.42, "r_y2": 543.53, "r_x3": 183.24, "r_y3": 543.53, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 550.14, "r_x1": 388.42, "r_y1": 550.14, "r_x2": 388.42, "r_y2": 547.42, "r_x3": 183.24, "r_y3": 547.42, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 554.04, "r_x1": 388.42, "r_y1": 554.04, "r_x2": 388.42, "r_y2": 551.32, "r_x3": 183.24, "r_y3": 551.32, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 557.94, "r_x1": 191.87, "r_y1": 557.94, "r_x2": 191.87, "r_y2": 555.22, "r_x3": 180.12, "r_y3": 555.22, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 521.02, "r_x1": 408.82, "r_y1": 521.02, "r_x2": 408.82, "r_y2": 518.3, "r_x3": 407.38, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 521.02, "r_x1": 450.49, "r_y1": 521.02, "r_x2": 450.49, "r_y2": 518.3, "r_x3": 410.26, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 524.92, "r_x1": 408.82, "r_y1": 524.92, "r_x2": 408.82, "r_y2": 522.2, "r_x3": 407.38, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 524.92, "r_x1": 450.49, "r_y1": 524.92, "r_x2": 450.49, "r_y2": 522.2, "r_x3": 410.26, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 528.81, "r_x1": 408.82, "r_y1": 528.81, "r_x2": 408.82, "r_y2": 526.1, "r_x3": 407.38, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 528.81, "r_x1": 450.49, "r_y1": 528.81, "r_x2": 450.49, "r_y2": 526.1, "r_x3": 410.26, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 532.71, "r_x1": 408.82, "r_y1": 532.71, "r_x2": 408.82, "r_y2": 530.0, "r_x3": 407.38, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 532.71, "r_x1": 450.49, "r_y1": 532.71, "r_x2": 450.49, "r_y2": 530.0, "r_x3": 410.26, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 536.61, "r_x1": 408.82, "r_y1": 536.61, "r_x2": 408.82, "r_y2": 533.9, "r_x3": 407.38, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 536.61, "r_x1": 450.49, "r_y1": 536.61, "r_x2": 450.49, "r_y2": 533.9, "r_x3": 410.26, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 540.51, "r_x1": 408.82, "r_y1": 540.51, "r_x2": 408.82, "r_y2": 537.79, "r_x3": 407.38, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 540.51, "r_x1": 450.49, "r_y1": 540.51, "r_x2": 450.49, "r_y2": 537.79, "r_x3": 410.26, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 544.41, "r_x1": 408.82, "r_y1": 544.41, "r_x2": 408.82, "r_y2": 541.69, "r_x3": 407.38, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 544.41, "r_x1": 450.49, "r_y1": 544.41, "r_x2": 450.49, "r_y2": 541.69, "r_x3": 410.26, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 548.31, "r_x1": 408.82, "r_y1": 548.31, "r_x2": 408.82, "r_y2": 545.59, "r_x3": 407.38, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 548.31, "r_x1": 450.49, "r_y1": 548.31, "r_x2": 450.49, "r_y2": 545.59, "r_x3": 410.26, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 552.21, "r_x1": 408.82, "r_y1": 552.21, "r_x2": 408.82, "r_y2": 549.49, "r_x3": 407.38, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 552.21, "r_x1": 450.49, "r_y1": 552.21, "r_x2": 450.49, "r_y2": 549.49, "r_x3": 410.26, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.53, "r_y0": 515.31, "r_x1": 181.85, "r_y1": 515.31, "r_x2": 181.85, "r_y2": 509.46, "r_x3": 164.53, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58, "r_y0": 515.31, "r_x1": 186.4, "r_y1": 515.31, "r_x2": 186.4, "r_y2": 509.46, "r_x3": 183.58, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.21, "r_y0": 515.31, "r_x1": 208.9, "r_y1": 515.31, "r_x2": 208.9, "r_y2": 509.46, "r_x3": 189.21, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63, "r_y0": 515.31, "r_x1": 221.04, "r_y1": 515.31, "r_x2": 221.04, "r_y2": 509.46, "r_x3": 210.63, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.46, "r_x1": 406.84, "r_y1": 515.46, "r_x2": 406.84, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.57, "r_y0": 515.46, "r_x1": 411.38, "r_y1": 515.46, "r_x2": 411.38, "r_y2": 509.6, "r_x3": 408.57, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.46, "r_x1": 433.89, "r_y1": 515.46, "r_x2": 433.89, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.62, "r_y0": 515.46, "r_x1": 446.03, "r_y1": 515.46, "r_x2": 446.03, "r_y2": 509.6, "r_x3": 435.62, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19, "r_y0": 526.39, "r_x1": 172.82, "r_y1": 526.39, "r_x2": 172.82, "r_y2": 519.07, "r_x3": 167.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.34, "r_y0": 455.94, "r_x1": 192.97, "r_y1": 455.94, "r_x2": 192.97, "r_y2": 448.62, "r_x3": 187.34, "r_y3": 448.62, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.39, "r_y0": 573.32, "r_x1": 173.02, "r_y1": 573.32, "r_x2": 173.02, "r_y2": 566.01, "r_x3": 167.39, "r_y3": 566.01, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.46, "r_y0": 629.09, "r_x1": 253.66, "r_y1": 629.09, "r_x2": 253.66, "r_y2": 621.78, "r_x3": 248.46, "r_y3": 621.78, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.51, "r_x1": 401.53, "r_y1": 526.51, "r_x2": 401.53, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.63, "r_y0": 597.27, "r_x1": 177.48, "r_y1": 597.27, "r_x2": 177.48, "r_y2": 580.29, "r_x3": 171.63, "r_y3": 580.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.06, "r_y0": 649.92, "r_x1": 256.91, "r_y1": 649.92, "r_x2": 256.91, "r_y2": 633.63, "r_x3": 251.06, "r_y3": 633.63, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 607.31, "r_x1": 427.04, "r_y1": 607.31, "r_x2": 427.04, "r_y2": 601.46, "r_x3": 372.15, "r_y3": 601.46, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 613.75, "r_x1": 430.07, "r_y1": 613.75, "r_x2": 430.07, "r_y2": 607.9, "r_x3": 372.15, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 648.72, "r_x1": 231.08, "r_y1": 648.72, "r_x2": 231.08, "r_y2": 642.87, "r_x3": 176.88, "r_y3": 642.87, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 655.17, "r_x1": 230.99, "r_y1": 655.17, "r_x2": 230.99, "r_y2": 649.31, "r_x3": 176.88, "r_y3": 649.31, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 661.61, "r_x1": 203.93, "r_y1": 661.61, "r_x2": 203.93, "r_y2": 655.76, "r_x3": 176.88, "r_y3": 655.76, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.56, "r_x3": 215.93, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.06, "r_y0": 569.16, "r_x1": 231.72, "r_y1": 569.16, "r_x2": 231.72, "r_y2": 557.56, "r_x3": 229.06, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.21, "r_y0": 451.2, "r_x1": 263.57, "r_y1": 451.2, "r_x2": 263.57, "r_y2": 448.46, "r_x3": 261.21, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33, "r_y0": 451.2, "r_x1": 313.64, "r_y1": 451.2, "r_x2": 313.64, "r_y2": 448.46, "r_x3": 312.33, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41, "r_y0": 451.2, "r_x1": 380.06, "r_y1": 451.2, "r_x2": 380.06, "r_y2": 448.46, "r_x3": 377.41, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 456.08, "r_x1": 205.82, "r_y1": 456.08, "r_x2": 205.82, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.21, "r_y0": 456.08, "r_x1": 229.77, "r_y1": 456.08, "r_x2": 229.77, "r_y2": 453.34, "r_x3": 222.21, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.27, "r_y0": 456.08, "r_x1": 250.83, "r_y1": 456.08, "r_x2": 250.83, "r_y2": 453.34, "r_x3": 243.27, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.08, "r_x1": 271.85, "r_y1": 456.08, "r_x2": 271.85, "r_y2": 453.34, "r_x3": 264.3, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.32, "r_y0": 456.08, "r_x1": 292.88, "r_y1": 456.08, "r_x2": 292.88, "r_y2": 453.34, "r_x3": 285.32, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.38, "r_y0": 456.08, "r_x1": 311.77, "r_y1": 456.08, "r_x2": 311.77, "r_y2": 453.34, "r_x3": 306.38, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.42, "r_y0": 456.08, "r_x1": 325.58, "r_y1": 456.08, "r_x2": 325.58, "r_y2": 453.34, "r_x3": 323.42, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.46, "r_y0": 456.08, "r_x1": 336.62, "r_y1": 456.08, "r_x2": 336.62, "r_y2": 453.34, "r_x3": 334.46, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.53, "r_y0": 456.08, "r_x1": 347.69, "r_y1": 456.08, "r_x2": 347.69, "r_y2": 453.34, "r_x3": 345.53, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.57, "r_y0": 456.08, "r_x1": 358.73, "r_y1": 456.08, "r_x2": 358.73, "r_y2": 453.34, "r_x3": 356.57, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.64, "r_y0": 456.08, "r_x1": 371.97, "r_y1": 456.08, "r_x2": 371.97, "r_y2": 453.34, "r_x3": 367.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.67, "r_y0": 456.08, "r_x1": 387.01, "r_y1": 456.08, "r_x2": 387.01, "r_y2": 453.34, "r_x3": 382.67, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.74, "r_y0": 456.08, "r_x1": 402.07, "r_y1": 456.08, "r_x2": 402.07, "r_y2": 453.34, "r_x3": 397.74, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 457.8, "r_x1": 414.93, "r_y1": 457.8, "r_x2": 414.93, "r_y2": 447.99, "r_x3": 412.79, "r_y3": 447.99, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.96, "r_y0": 456.08, "r_x1": 422.52, "r_y1": 456.08, "r_x2": 422.52, "r_y2": 453.34, "r_x3": 414.96, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.58, "r_y1": 466.66, "r_x2": 204.58, "r_y2": 463.92, "r_x3": 200.64, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.92, "r_x3": 367.63, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 466.66, "r_x1": 384.62, "r_y1": 466.66, "r_x2": 384.62, "r_y2": 463.92, "r_x3": 382.66, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 466.66, "r_x1": 399.68, "r_y1": 466.66, "r_x2": 399.68, "r_y2": 463.92, "r_x3": 397.73, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.54, "r_x1": 206.52, "r_y1": 471.54, "r_x2": 206.52, "r_y2": 468.8, "r_x3": 200.64, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 471.54, "r_x1": 266.26, "r_y1": 471.54, "r_x2": 266.26, "r_y2": 468.8, "r_x3": 264.29, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37, "r_y0": 471.54, "r_x1": 308.34, "r_y1": 471.54, "r_x2": 308.34, "r_y2": 468.8, "r_x3": 306.37, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52, "r_y0": 471.54, "r_x1": 347.48, "r_y1": 471.54, "r_x2": 347.48, "r_y2": 468.8, "r_x3": 345.52, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56, "r_y0": 471.54, "r_x1": 358.52, "r_y1": 471.54, "r_x2": 358.52, "r_y2": 468.8, "r_x3": 356.56, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 471.54, "r_x1": 369.59, "r_y1": 471.54, "r_x2": 369.59, "r_y2": 468.8, "r_x3": 367.63, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 471.54, "r_x1": 384.63, "r_y1": 471.54, "r_x2": 384.63, "r_y2": 468.8, "r_x3": 382.66, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.42, "r_x1": 206.52, "r_y1": 476.42, "r_x2": 206.52, "r_y2": 473.68, "r_x3": 200.64, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 476.42, "r_x1": 266.26, "r_y1": 476.42, "r_x2": 266.26, "r_y2": 473.68, "r_x3": 264.29, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.27, "r_x1": 206.52, "r_y1": 481.27, "r_x2": 206.52, "r_y2": 478.53, "r_x3": 200.64, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26, "r_y0": 481.27, "r_x1": 245.23, "r_y1": 481.27, "r_x2": 245.23, "r_y2": 478.53, "r_x3": 243.26, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 481.27, "r_x1": 266.26, "r_y1": 481.27, "r_x2": 266.26, "r_y2": 478.53, "r_x3": 264.29, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.27, "r_x1": 325.37, "r_y1": 481.27, "r_x2": 325.37, "r_y2": 478.53, "r_x3": 323.4, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 481.27, "r_x1": 399.69, "r_y1": 481.27, "r_x2": 399.69, "r_y2": 478.53, "r_x3": 397.73, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.15, "r_x1": 206.52, "r_y1": 486.15, "r_x2": 206.52, "r_y2": 483.41, "r_x3": 200.64, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 486.15, "r_x1": 384.62, "r_y1": 486.15, "r_x2": 384.62, "r_y2": 483.41, "r_x3": 382.66, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 486.15, "r_x1": 401.65, "r_y1": 486.15, "r_x2": 401.65, "r_y2": 483.41, "r_x3": 397.73, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 486.15, "r_x1": 414.74, "r_y1": 486.15, "r_x2": 414.74, "r_y2": 483.41, "r_x3": 412.79, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 491.03, "r_x1": 207.14, "r_y1": 491.03, "r_x2": 207.14, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 491.03, "r_x1": 369.78, "r_y1": 491.03, "r_x2": 369.78, "r_y2": 488.29, "r_x3": 367.63, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 491.03, "r_x1": 384.82, "r_y1": 491.03, "r_x2": 384.82, "r_y2": 488.29, "r_x3": 382.66, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 491.03, "r_x1": 402.05, "r_y1": 491.03, "r_x2": 402.05, "r_y2": 488.29, "r_x3": 397.73, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 495.9, "r_x1": 208.49, "r_y1": 495.9, "r_x2": 208.49, "r_y2": 493.17, "r_x3": 200.64, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 495.9, "r_x1": 266.26, "r_y1": 495.9, "r_x2": 266.26, "r_y2": 493.17, "r_x3": 264.29, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 58, "label": "text", "bbox": { "l": 180.12, "t": 516.23, "r": 190.62, "b": 518.95, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 518.95, "r_x1": 190.62, "r_y1": 518.95, "r_x2": 190.62, "r_y2": 516.23, "r_x3": 180.12, "r_y3": 516.23, "coord_origin": "TOPLEFT" }, "text": "", "orig": "
", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 59, "label": "text", "bbox": { "l": 183.24, "t": 520.13, "r": 304.55, "b": 522.85, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 522.85, "r_x1": 304.55, "r_y1": 522.85, "r_x2": 304.55, "r_y2": 520.13, "r_x3": 183.24, "r_y3": 520.13, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 60, "label": "text", "bbox": { "l": 183.24, "t": 524.03, "r": 388.42, "b": 526.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 526.75, "r_x1": 388.42, "r_y1": 526.75, "r_x2": 388.42, "r_y2": 524.03, "r_x3": 183.24, "r_y3": 524.03, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 61, "label": "text", "bbox": { "l": 183.24, "t": 527.93, "r": 388.42, "b": 530.65, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 530.65, "r_x1": 388.42, "r_y1": 530.65, "r_x2": 388.42, "r_y2": 527.93, "r_x3": 183.24, "r_y3": 527.93, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 62, "label": "text", "bbox": { "l": 183.24, "t": 531.83, "r": 388.42, "b": 534.55, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 534.55, "r_x1": 388.42, "r_y1": 534.55, "r_x2": 388.42, "r_y2": 531.83, "r_x3": 183.24, "r_y3": 531.83, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 63, "label": "text", "bbox": { "l": 183.24, "t": 535.73, "r": 388.42, "b": 538.44, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 538.44, "r_x1": 388.42, "r_y1": 538.44, "r_x2": 388.42, "r_y2": 535.73, "r_x3": 183.24, "r_y3": 535.73, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 64, "label": "text", "bbox": { "l": 183.24, "t": 539.63, "r": 388.42, "b": 542.34, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 542.34, "r_x1": 388.42, "r_y1": 542.34, "r_x2": 388.42, "r_y2": 539.63, "r_x3": 183.24, "r_y3": 539.63, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 65, "label": "text", "bbox": { "l": 183.24, "t": 543.53, "r": 388.42, "b": 546.24, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 546.24, "r_x1": 388.42, "r_y1": 546.24, "r_x2": 388.42, "r_y2": 543.53, "r_x3": 183.24, "r_y3": 543.53, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 66, "label": "text", "bbox": { "l": 183.24, "t": 547.42, "r": 388.42, "b": 550.14, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 75, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 550.14, "r_x1": 388.42, "r_y1": 550.14, "r_x2": 388.42, "r_y2": 547.42, "r_x3": 183.24, "r_y3": 547.42, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 67, "label": "text", "bbox": { "l": 183.24, "t": 551.32, "r": 388.42, "b": 554.04, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 76, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.24, "r_y0": 554.04, "r_x1": 388.42, "r_y1": 554.04, "r_x2": 388.42, "r_y2": 551.32, "r_x3": 183.24, "r_y3": 551.32, "coord_origin": "TOPLEFT" }, "text": "", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 68, "label": "text", "bbox": { "l": 180.12, "t": 555.22, "r": 191.87, "b": 557.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 77, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 180.12, "r_y0": 557.94, "r_x1": 191.87, "r_y1": 557.94, "r_x2": 191.87, "r_y2": 555.22, "r_x3": 180.12, "r_y3": 555.22, "coord_origin": "TOPLEFT" }, "text": "
", "orig": "", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 69, "label": "text", "bbox": { "l": 407.38, "t": 518.3, "r": 408.82, "b": 521.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 78, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 521.02, "r_x1": 408.82, "r_y1": 521.02, "r_x2": 408.82, "r_y2": 518.3, "r_x3": 407.38, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 70, "label": "text", "bbox": { "l": 410.26, "t": 518.3, "r": 450.49, "b": 521.02, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 79, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 521.02, "r_x1": 450.49, "r_y1": 521.02, "r_x2": 450.49, "r_y2": 518.3, "r_x3": 410.26, "r_y3": 518.3, "coord_origin": "TOPLEFT" }, "text": "C L L L C L L L L L C L L NL", "orig": "C L L L C L L L L L C L L NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 71, "label": "text", "bbox": { "l": 407.38, "t": 522.2, "r": 408.82, "b": 524.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 80, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 524.92, "r_x1": 408.82, "r_y1": 524.92, "r_x2": 408.82, "r_y2": 522.2, "r_x3": 407.38, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 72, "label": "text", "bbox": { "l": 410.26, "t": 522.2, "r": 450.49, "b": 524.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 81, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 524.92, "r_x1": 450.49, "r_y1": 524.92, "r_x2": 450.49, "r_y2": 522.2, "r_x3": 410.26, "r_y3": 522.2, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 73, "label": "text", "bbox": { "l": 407.38, "t": 526.1, "r": 408.82, "b": 528.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 82, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 528.81, "r_x1": 408.82, "r_y1": 528.81, "r_x2": 408.82, "r_y2": 526.1, "r_x3": 407.38, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 74, "label": "text", "bbox": { "l": 410.26, "t": 526.1, "r": 450.49, "b": 528.81, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 83, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 528.81, "r_x1": 450.49, "r_y1": 528.81, "r_x2": 450.49, "r_y2": 526.1, "r_x3": 410.26, "r_y3": 526.1, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 75, "label": "text", "bbox": { "l": 407.38, "t": 530.0, "r": 408.82, "b": 532.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 84, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 532.71, "r_x1": 408.82, "r_y1": 532.71, "r_x2": 408.82, "r_y2": 530.0, "r_x3": 407.38, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 76, "label": "text", "bbox": { "l": 410.26, "t": 530.0, "r": 450.49, "b": 532.71, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 85, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 532.71, "r_x1": 450.49, "r_y1": 532.71, "r_x2": 450.49, "r_y2": 530.0, "r_x3": 410.26, "r_y3": 530.0, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 77, "label": "text", "bbox": { "l": 407.38, "t": 533.9, "r": 408.82, "b": 536.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 86, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 536.61, "r_x1": 408.82, "r_y1": 536.61, "r_x2": 408.82, "r_y2": 533.9, "r_x3": 407.38, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 78, "label": "text", "bbox": { "l": 410.26, "t": 533.9, "r": 450.49, "b": 536.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 87, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 536.61, "r_x1": 450.49, "r_y1": 536.61, "r_x2": 450.49, "r_y2": 533.9, "r_x3": 410.26, "r_y3": 533.9, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 79, "label": "text", "bbox": { "l": 407.38, "t": 537.79, "r": 408.82, "b": 540.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 88, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 540.51, "r_x1": 408.82, "r_y1": 540.51, "r_x2": 408.82, "r_y2": 537.79, "r_x3": 407.38, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 80, "label": "text", "bbox": { "l": 410.26, "t": 537.79, "r": 450.49, "b": 540.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 89, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 540.51, "r_x1": 450.49, "r_y1": 540.51, "r_x2": 450.49, "r_y2": 537.79, "r_x3": 410.26, "r_y3": 537.79, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 81, "label": "text", "bbox": { "l": 407.38, "t": 541.69, "r": 408.82, "b": 544.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 90, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 544.41, "r_x1": 408.82, "r_y1": 544.41, "r_x2": 408.82, "r_y2": 541.69, "r_x3": 407.38, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 82, "label": "text", "bbox": { "l": 410.26, "t": 541.69, "r": 450.49, "b": 544.41, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 91, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 544.41, "r_x1": 450.49, "r_y1": 544.41, "r_x2": 450.49, "r_y2": 541.69, "r_x3": 410.26, "r_y3": 541.69, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 83, "label": "text", "bbox": { "l": 407.38, "t": 545.59, "r": 408.82, "b": 548.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 92, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 548.31, "r_x1": 408.82, "r_y1": 548.31, "r_x2": 408.82, "r_y2": 545.59, "r_x3": 407.38, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 84, "label": "text", "bbox": { "l": 410.26, "t": 545.59, "r": 450.49, "b": 548.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 93, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 548.31, "r_x1": 450.49, "r_y1": 548.31, "r_x2": 450.49, "r_y2": 545.59, "r_x3": 410.26, "r_y3": 545.59, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 85, "label": "text", "bbox": { "l": 407.38, "t": 549.49, "r": 408.82, "b": 552.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 94, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 407.38, "r_y0": 552.21, "r_x1": 408.82, "r_y1": 552.21, "r_x2": 408.82, "r_y2": 549.49, "r_x3": 407.38, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 86, "label": "text", "bbox": { "l": 410.26, "t": 549.49, "r": 450.49, "b": 552.21, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 95, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 410.26, "r_y0": 552.21, "r_x1": 450.49, "r_y1": 552.21, "r_x2": 450.49, "r_y2": 549.49, "r_x3": 410.26, "r_y3": 549.49, "coord_origin": "TOPLEFT" }, "text": "C C C C C C C C C C C C C NL", "orig": "C C C C C C C C C C C C C NL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 87, "label": "text", "bbox": { "l": 164.53, "t": 509.46, "r": 181.85, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 96, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 164.53, "r_y0": 515.31, "r_x1": 181.85, "r_y1": 515.31, "r_x2": 181.85, "r_y2": 509.46, "r_x3": 164.53, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 88, "label": "text", "bbox": { "l": 183.58, "t": 509.46, "r": 186.4, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 97, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 183.58, "r_y0": 515.31, "r_x1": 186.4, "r_y1": 515.31, "r_x2": 186.4, "r_y2": 509.46, "r_x3": 183.58, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 89, "label": "text", "bbox": { "l": 189.21, "t": 509.46, "r": 208.9, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 98, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 189.21, "r_y0": 515.31, "r_x1": 208.9, "r_y1": 515.31, "r_x2": 208.9, "r_y2": 509.46, "r_x3": 189.21, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 90, "label": "text", "bbox": { "l": 210.63, "t": 509.46, "r": 221.04, "b": 515.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 99, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.63, "r_y0": 515.31, "r_x1": 221.04, "r_y1": 515.31, "r_x2": 221.04, "r_y2": 509.46, "r_x3": 210.63, "r_y3": 509.46, "coord_origin": "TOPLEFT" }, "text": "258", "orig": "258", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 91, "label": "text", "bbox": { "l": 390.2, "t": 509.6, "r": 406.84, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 100, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 390.2, "r_y0": 515.46, "r_x1": 406.84, "r_y1": 515.46, "r_x2": 406.84, "r_y2": 509.6, "r_x3": 390.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 92, "label": "text", "bbox": { "l": 408.57, "t": 509.6, "r": 411.38, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 101, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 408.57, "r_y0": 515.46, "r_x1": 411.38, "r_y1": 515.46, "r_x2": 411.38, "r_y2": 509.6, "r_x3": 408.57, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "#", "orig": "#", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 93, "label": "text", "bbox": { "l": 414.2, "t": 509.6, "r": 433.89, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 102, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.2, "r_y0": 515.46, "r_x1": 433.89, "r_y1": 515.46, "r_x2": 433.89, "r_y2": 509.6, "r_x3": 414.2, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "tokens:", "orig": "tokens:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 94, "label": "text", "bbox": { "l": 435.62, "t": 509.6, "r": 446.03, "b": 515.46, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 103, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 435.62, "r_y0": 515.46, "r_x1": 446.03, "r_y1": 515.46, "r_x2": 446.03, "r_y2": 509.6, "r_x3": 435.62, "r_y3": 509.6, "coord_origin": "TOPLEFT" }, "text": "135", "orig": "135", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 95, "label": "text", "bbox": { "l": 167.19, "t": 519.07, "r": 172.82, "b": 526.39, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 104, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.19, "r_y0": 526.39, "r_x1": 172.82, "r_y1": 526.39, "r_x2": 172.82, "r_y2": 519.07, "r_x3": 167.19, "r_y3": 519.07, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 96, "label": "text", "bbox": { "l": 187.34, "t": 448.62, "r": 192.97, "b": 455.94, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 105, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 187.34, "r_y0": 455.94, "r_x1": 192.97, "r_y1": 455.94, "r_x2": 192.97, "r_y2": 448.62, "r_x3": 187.34, "r_y3": 448.62, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 97, "label": "text", "bbox": { "l": 167.39, "t": 566.01, "r": 173.02, "b": 573.32, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 106, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.39, "r_y0": 573.32, "r_x1": 173.02, "r_y1": 573.32, "r_x2": 173.02, "r_y2": 566.01, "r_x3": 167.39, "r_y3": 566.01, "coord_origin": "TOPLEFT" }, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 98, "label": "text", "bbox": { "l": 248.46, "t": 621.78, "r": 253.66, "b": 629.09, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 107, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 248.46, "r_y0": 629.09, "r_x1": 253.66, "r_y1": 629.09, "r_x2": 253.66, "r_y2": 621.78, "r_x3": 248.46, "r_y3": 621.78, "coord_origin": "TOPLEFT" }, "text": "E", "orig": "E", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 99, "label": "text", "bbox": { "l": 395.9, "t": 519.2, "r": 401.53, "b": 526.51, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 108, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 395.9, "r_y0": 526.51, "r_x1": 401.53, "r_y1": 526.51, "r_x2": 401.53, "r_y2": 519.2, "r_x3": 395.9, "r_y3": 519.2, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 100, "label": "text", "bbox": { "l": 171.63, "t": 580.29, "r": 177.48, "b": 597.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 109, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.63, "r_y0": 597.27, "r_x1": 177.48, "r_y1": 597.27, "r_x2": 177.48, "r_y2": 580.29, "r_x3": 171.63, "r_y3": 580.29, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 101, "label": "text", "bbox": { "l": 251.06, "t": 633.63, "r": 256.91, "b": 649.92, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 110, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 251.06, "r_y0": 649.92, "r_x1": 256.91, "r_y1": 649.92, "r_x2": 256.91, "r_y2": 633.63, "r_x3": 251.06, "r_y3": 633.63, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 102, "label": "text", "bbox": { "l": 372.15, "t": 601.46, "r": 427.04, "b": 607.31, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 111, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 607.31, "r_x1": 427.04, "r_y1": 607.31, "r_x2": 427.04, "r_y2": 601.46, "r_x3": 372.15, "r_y3": 601.46, "coord_origin": "TOPLEFT" }, "text": "HTML model shows", "orig": "HTML model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 103, "label": "text", "bbox": { "l": 372.15, "t": 607.9, "r": 430.07, "b": 613.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 112, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 372.15, "r_y0": 613.75, "r_x1": 430.07, "r_y1": 613.75, "r_x2": 430.07, "r_y2": 607.9, "r_x3": 372.15, "r_y3": 607.9, "coord_origin": "TOPLEFT" }, "text": "bounding box drifting", "orig": "bounding box drifting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 104, "label": "text", "bbox": { "l": 176.88, "t": 642.87, "r": 231.08, "b": 648.72, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 113, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 648.72, "r_x1": 231.08, "r_y1": 648.72, "r_x2": 231.08, "r_y2": 642.87, "r_x3": 176.88, "r_y3": 642.87, "coord_origin": "TOPLEFT" }, "text": "OTSL model shows", "orig": "OTSL model shows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 105, "label": "text", "bbox": { "l": 176.88, "t": 649.31, "r": 230.99, "b": 655.17, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 114, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 655.17, "r_x1": 230.99, "r_y1": 655.17, "r_x2": 230.99, "r_y2": 649.31, "r_x3": 176.88, "r_y3": 649.31, "coord_origin": "TOPLEFT" }, "text": "clean bounding box", "orig": "clean bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 106, "label": "text", "bbox": { "l": 176.88, "t": 655.76, "r": 203.93, "b": 661.61, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 115, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 176.88, "r_y0": 661.61, "r_x1": 203.93, "r_y1": 661.61, "r_x2": 203.93, "r_y2": 655.76, "r_x3": 176.88, "r_y3": 655.76, "coord_origin": "TOPLEFT" }, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 107, "label": "text", "bbox": { "l": 215.93, "t": 557.56, "r": 218.47, "b": 569.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 116, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 215.93, "r_y0": 569.16, "r_x1": 218.47, "r_y1": 569.16, "r_x2": 218.47, "r_y2": 557.56, "r_x3": 215.93, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 108, "label": "text", "bbox": { "l": 229.06, "t": 557.56, "r": 231.72, "b": 569.16, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 117, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 229.06, "r_y0": 569.16, "r_x1": 231.72, "r_y1": 569.16, "r_x2": 231.72, "r_y2": 557.56, "r_x3": 229.06, "r_y3": 557.56, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 109, "label": "text", "bbox": { "l": 261.21, "t": 448.46, "r": 263.57, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 119, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 261.21, "r_y0": 451.2, "r_x1": 263.57, "r_y1": 451.2, "r_x2": 263.57, "r_y2": 448.46, "r_x3": 261.21, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "S", "orig": "S", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 110, "label": "text", "bbox": { "l": 312.33, "t": 448.46, "r": 313.64, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 120, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 312.33, "r_y0": 451.2, "r_x1": 313.64, "r_y1": 451.2, "r_x2": 313.64, "r_y2": 448.46, "r_x3": 312.33, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "I", "orig": "I", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 111, "label": "text", "bbox": { "l": 377.41, "t": 448.46, "r": 380.06, "b": 451.2, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 121, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 377.41, "r_y0": 451.2, "r_x1": 380.06, "r_y1": 451.2, "r_x2": 380.06, "r_y2": 448.46, "r_x3": 377.41, "r_y3": 448.46, "coord_origin": "TOPLEFT" }, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 112, "label": "text", "bbox": { "l": 200.64, "t": 453.34, "r": 205.82, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 122, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 456.08, "r_x1": 205.82, "r_y1": 456.08, "r_x2": 205.82, "r_y2": 453.34, "r_x3": 200.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "ST", "orig": "ST", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 113, "label": "text", "bbox": { "l": 222.21, "t": 453.34, "r": 229.77, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 123, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 222.21, "r_y0": 456.08, "r_x1": 229.77, "r_y1": 456.08, "r_x2": 229.77, "r_y2": 453.34, "r_x3": 222.21, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.03", "orig": "0.03", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 114, "label": "text", "bbox": { "l": 243.27, "t": 453.34, "r": 250.83, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 124, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.27, "r_y0": 456.08, "r_x1": 250.83, "r_y1": 456.08, "r_x2": 250.83, "r_y2": 453.34, "r_x3": 243.27, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.06", "orig": "0.06", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 115, "label": "text", "bbox": { "l": 264.3, "t": 453.34, "r": 271.85, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 125, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.3, "r_y0": 456.08, "r_x1": 271.85, "r_y1": 456.08, "r_x2": 271.85, "r_y2": 453.34, "r_x3": 264.3, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.12", "orig": "0.12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 116, "label": "text", "bbox": { "l": 285.32, "t": 453.34, "r": 292.88, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 126, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.32, "r_y0": 456.08, "r_x1": 292.88, "r_y1": 456.08, "r_x2": 292.88, "r_y2": 453.34, "r_x3": 285.32, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.25", "orig": "0.25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 117, "label": "text", "bbox": { "l": 306.38, "t": 453.34, "r": 311.77, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 127, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.38, "r_y0": 456.08, "r_x1": 311.77, "r_y1": 456.08, "r_x2": 311.77, "r_y2": 453.34, "r_x3": 306.38, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 118, "label": "text", "bbox": { "l": 323.42, "t": 453.34, "r": 325.58, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 128, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.42, "r_y0": 456.08, "r_x1": 325.58, "r_y1": 456.08, "r_x2": 325.58, "r_y2": 453.34, "r_x3": 323.42, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 119, "label": "text", "bbox": { "l": 334.46, "t": 453.34, "r": 336.62, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 129, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.46, "r_y0": 456.08, "r_x1": 336.62, "r_y1": 456.08, "r_x2": 336.62, "r_y2": 453.34, "r_x3": 334.46, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 120, "label": "text", "bbox": { "l": 345.53, "t": 453.34, "r": 347.69, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 130, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.53, "r_y0": 456.08, "r_x1": 347.69, "r_y1": 456.08, "r_x2": 347.69, "r_y2": 453.34, "r_x3": 345.53, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 121, "label": "text", "bbox": { "l": 356.57, "t": 453.34, "r": 358.73, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 131, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.57, "r_y0": 456.08, "r_x1": 358.73, "r_y1": 456.08, "r_x2": 358.73, "r_y2": 453.34, "r_x3": 356.57, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 122, "label": "text", "bbox": { "l": 367.64, "t": 453.34, "r": 371.97, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 132, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.64, "r_y0": 456.08, "r_x1": 371.97, "r_y1": 456.08, "r_x2": 371.97, "r_y2": 453.34, "r_x3": 367.64, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 123, "label": "text", "bbox": { "l": 382.67, "t": 453.34, "r": 387.01, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 133, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.67, "r_y0": 456.08, "r_x1": 387.01, "r_y1": 456.08, "r_x2": 387.01, "r_y2": 453.34, "r_x3": 382.67, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 124, "label": "text", "bbox": { "l": 397.74, "t": 453.34, "r": 402.07, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 134, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.74, "r_y0": 456.08, "r_x1": 402.07, "r_y1": 456.08, "r_x2": 402.07, "r_y2": 453.34, "r_x3": 397.74, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": "64", "orig": "64", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 125, "label": "text", "bbox": { "l": 412.79, "t": 447.99, "r": 414.93, "b": 457.8, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 135, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 457.8, "r_x1": 414.93, "r_y1": 457.8, "r_x2": 414.93, "r_y2": 447.99, "r_x3": 412.79, "r_y3": 447.99, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 126, "label": "text", "bbox": { "l": 414.96, "t": 453.34, "r": 422.52, "b": 456.08, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 136, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 414.96, "r_y0": 456.08, "r_x1": 422.52, "r_y1": 456.08, "r_x2": 422.52, "r_y2": 453.34, "r_x3": 414.96, "r_y3": 453.34, "coord_origin": "TOPLEFT" }, "text": " 128", "orig": " 128", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 127, "label": "text", "bbox": { "l": 200.64, "t": 463.92, "r": 204.58, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 137, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 466.66, "r_x1": 204.58, "r_y1": 466.66, "r_x2": 204.58, "r_y2": 463.92, "r_x3": 200.64, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "63", "orig": "63", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 128, "label": "text", "bbox": { "l": 367.63, "t": 463.92, "r": 369.58, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 138, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 466.66, "r_x1": 369.58, "r_y1": 466.66, "r_x2": 369.58, "r_y2": 463.92, "r_x3": 367.63, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 129, "label": "text", "bbox": { "l": 382.66, "t": 463.92, "r": 384.62, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 139, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 466.66, "r_x1": 384.62, "r_y1": 466.66, "r_x2": 384.62, "r_y2": 463.92, "r_x3": 382.66, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 130, "label": "text", "bbox": { "l": 397.73, "t": 463.92, "r": 399.68, "b": 466.66, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 140, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 466.66, "r_x1": 399.68, "r_y1": 466.66, "r_x2": 399.68, "r_y2": 463.92, "r_x3": 397.73, "r_y3": 463.92, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 131, "label": "text", "bbox": { "l": 200.64, "t": 468.8, "r": 206.52, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 141, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 471.54, "r_x1": 206.52, "r_y1": 471.54, "r_x2": 206.52, "r_y2": 468.8, "r_x3": 200.64, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "199", "orig": "199", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 132, "label": "text", "bbox": { "l": 264.29, "t": 468.8, "r": 266.26, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 142, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 471.54, "r_x1": 266.26, "r_y1": 471.54, "r_x2": 266.26, "r_y2": 468.8, "r_x3": 264.29, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 133, "label": "text", "bbox": { "l": 306.37, "t": 468.8, "r": 308.34, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 143, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 306.37, "r_y0": 471.54, "r_x1": 308.34, "r_y1": 471.54, "r_x2": 308.34, "r_y2": 468.8, "r_x3": 306.37, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 134, "label": "text", "bbox": { "l": 345.52, "t": 468.8, "r": 347.48, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 144, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 345.52, "r_y0": 471.54, "r_x1": 347.48, "r_y1": 471.54, "r_x2": 347.48, "r_y2": 468.8, "r_x3": 345.52, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 135, "label": "text", "bbox": { "l": 356.56, "t": 468.8, "r": 358.52, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 145, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 356.56, "r_y0": 471.54, "r_x1": 358.52, "r_y1": 471.54, "r_x2": 358.52, "r_y2": 468.8, "r_x3": 356.56, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 136, "label": "text", "bbox": { "l": 367.63, "t": 468.8, "r": 369.59, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 146, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 471.54, "r_x1": 369.59, "r_y1": 471.54, "r_x2": 369.59, "r_y2": 468.8, "r_x3": 367.63, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 137, "label": "text", "bbox": { "l": 382.66, "t": 468.8, "r": 384.63, "b": 471.54, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 147, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 471.54, "r_x1": 384.63, "r_y1": 471.54, "r_x2": 384.63, "r_y2": 468.8, "r_x3": 382.66, "r_y3": 468.8, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 138, "label": "text", "bbox": { "l": 200.64, "t": 473.68, "r": 206.52, "b": 476.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 148, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 476.42, "r_x1": 206.52, "r_y1": 476.42, "r_x2": 206.52, "r_y2": 473.68, "r_x3": 200.64, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "416", "orig": "416", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 139, "label": "text", "bbox": { "l": 264.29, "t": 473.68, "r": 266.26, "b": 476.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 149, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 476.42, "r_x1": 266.26, "r_y1": 476.42, "r_x2": 266.26, "r_y2": 473.68, "r_x3": 264.29, "r_y3": 473.68, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 140, "label": "text", "bbox": { "l": 200.64, "t": 478.53, "r": 206.52, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 150, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 481.27, "r_x1": 206.52, "r_y1": 481.27, "r_x2": 206.52, "r_y2": 478.53, "r_x3": 200.64, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "230", "orig": "230", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 141, "label": "text", "bbox": { "l": 243.26, "t": 478.53, "r": 245.23, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 151, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 243.26, "r_y0": 481.27, "r_x1": 245.23, "r_y1": 481.27, "r_x2": 245.23, "r_y2": 478.53, "r_x3": 243.26, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 142, "label": "text", "bbox": { "l": 264.29, "t": 478.53, "r": 266.26, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 152, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 481.27, "r_x1": 266.26, "r_y1": 481.27, "r_x2": 266.26, "r_y2": 478.53, "r_x3": 264.29, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 143, "label": "text", "bbox": { "l": 323.4, "t": 478.53, "r": 325.37, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 153, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 323.4, "r_y0": 481.27, "r_x1": 325.37, "r_y1": 481.27, "r_x2": 325.37, "r_y2": 478.53, "r_x3": 323.4, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 144, "label": "text", "bbox": { "l": 397.73, "t": 478.53, "r": 399.69, "b": 481.27, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 154, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 481.27, "r_x1": 399.69, "r_y1": 481.27, "r_x2": 399.69, "r_y2": 478.53, "r_x3": 397.73, "r_y3": 478.53, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 145, "label": "text", "bbox": { "l": 200.64, "t": 483.41, "r": 206.52, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 155, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 486.15, "r_x1": 206.52, "r_y1": 486.15, "r_x2": 206.52, "r_y2": 483.41, "r_x3": 200.64, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "276", "orig": "276", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 146, "label": "text", "bbox": { "l": 382.66, "t": 483.41, "r": 384.62, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 156, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 486.15, "r_x1": 384.62, "r_y1": 486.15, "r_x2": 384.62, "r_y2": 483.41, "r_x3": 382.66, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 147, "label": "text", "bbox": { "l": 397.73, "t": 483.41, "r": 401.65, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 157, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 486.15, "r_x1": 401.65, "r_y1": 486.15, "r_x2": 401.65, "r_y2": 483.41, "r_x3": 397.73, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 148, "label": "text", "bbox": { "l": 412.79, "t": 483.41, "r": 414.74, "b": 486.15, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 158, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 412.79, "r_y0": 486.15, "r_x1": 414.74, "r_y1": 486.15, "r_x2": 414.74, "r_y2": 483.41, "r_x3": 412.79, "r_y3": 483.41, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 149, "label": "text", "bbox": { "l": 200.64, "t": 488.29, "r": 207.14, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 159, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 491.03, "r_x1": 207.14, "r_y1": 491.03, "r_x2": 207.14, "r_y2": 488.29, "r_x3": 200.64, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "320", "orig": "320", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 150, "label": "text", "bbox": { "l": 367.63, "t": 488.29, "r": 369.78, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 160, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 367.63, "r_y0": 491.03, "r_x1": 369.78, "r_y1": 491.03, "r_x2": 369.78, "r_y2": 488.29, "r_x3": 367.63, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 151, "label": "text", "bbox": { "l": 382.66, "t": 488.29, "r": 384.82, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 161, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 382.66, "r_y0": 491.03, "r_x1": 384.82, "r_y1": 491.03, "r_x2": 384.82, "r_y2": 488.29, "r_x3": 382.66, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 152, "label": "text", "bbox": { "l": 397.73, "t": 488.29, "r": 402.05, "b": 491.03, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 162, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 397.73, "r_y0": 491.03, "r_x1": 402.05, "r_y1": 491.03, "r_x2": 402.05, "r_y2": 488.29, "r_x3": 397.73, "r_y3": 488.29, "coord_origin": "TOPLEFT" }, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 153, "label": "text", "bbox": { "l": 200.64, "t": 493.17, "r": 208.49, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 163, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 200.64, "r_y0": 495.9, "r_x1": 208.49, "r_y1": 495.9, "r_x2": 208.49, "r_y2": 493.17, "r_x3": 200.64, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "2013", "orig": "2013", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 154, "label": "text", "bbox": { "l": 264.29, "t": 493.17, "r": 266.26, "b": 495.9, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 164, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 264.29, "r_y0": 495.9, "r_x1": 266.26, "r_y1": 495.9, "r_x2": 266.26, "r_y2": 493.17, "r_x3": 264.29, "r_y3": 493.17, "coord_origin": "TOPLEFT" }, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null }, { "label": "text", "id": 155, "page_no": 9, "cluster": { "id": 155, "label": "text", "bbox": { "l": 227.91, "t": 665.83, "r": 230.1, "b": 675.35, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 165, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 227.91, "r_y0": 675.35, "r_x1": 230.1, "r_y1": 675.35, "r_x2": 230.1, "r_y2": 665.83, "r_x3": 227.91, "r_y3": 665.83, "coord_origin": "TOPLEFT" }, "text": "\u03bc", "orig": "\u03bc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u03bc" }, { "label": "text", "id": 156, "page_no": 9, "cluster": { "id": 156, "label": "text", "bbox": { "l": 300.58, "t": 683.62, "r": 302.73, "b": 693.43, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 166, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 300.58, "r_y0": 693.43, "r_x1": 302.73, "r_y1": 693.43, "r_x2": 302.73, "r_y2": 683.62, "r_x3": 300.58, "r_y3": 683.62, "coord_origin": "TOPLEFT" }, "text": "\u2265", "orig": "\u2265", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "\u2265" } ], "headers": [ { "label": "page_header", "id": 7, "page_no": 9, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 143.98, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.831, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10" }, { "label": "page_header", "id": 6, "page_no": 9, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.82, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.837, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 10, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.38, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 471.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 133.73, "r_x1": 162.64, "r_y1": 133.73, "r_x2": 162.64, "r_y2": 125.8, "r_x3": 134.76, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.22, "r_y0": 133.93, "r_x1": 480.59, "r_y1": 133.93, "r_x2": 480.59, "r_y2": 125.86, "r_x3": 165.22, "r_y3": 125.86, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 144.89, "r_x1": 480.59, "r_y1": 144.89, "r_x2": 480.59, "r_y2": 136.82, "r_x3": 134.76, "r_y3": 136.82, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.85, "r_x1": 480.59, "r_y1": 155.85, "r_x2": 480.59, "r_y2": 147.78, "r_x3": 134.76, "r_y3": 147.78, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 166.81, "r_x1": 480.59, "r_y1": 166.81, "r_x2": 480.59, "r_y2": 158.74, "r_x3": 134.76, "r_y3": 158.74, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 177.77, "r_x1": 415.84, "r_y1": 177.77, "r_x2": 415.84, "r_y2": 169.7, "r_x3": 134.76, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.36, "r_x1": 177.6, "r_y1": 320.36, "r_x2": 177.6, "r_y2": 312.45, "r_x3": 171.5, "r_y3": 312.45, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.06, "r_y0": 500.57, "r_x1": 177.15, "r_y1": 500.57, "r_x2": 177.15, "r_y2": 492.65, "r_x3": 171.06, "r_y3": 492.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 633.42, "r_x1": 374.96, "r_y1": 633.42, "r_x2": 374.96, "r_y2": 627.48, "r_x3": 283.05, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 623.29, "r_x1": 398.06, "r_y1": 623.29, "r_x2": 398.06, "r_y2": 617.36, "r_x3": 283.05, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64, "r_y0": 471.53, "r_x1": 437.51, "r_y1": 471.53, "r_x2": 437.51, "r_y2": 465.6, "r_x3": 293.64, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 294.29, "r_x1": 239.23, "r_y1": 294.29, "r_x2": 239.23, "r_y2": 288.36, "r_x3": 181.89, "r_y3": 288.36, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 300.83, "r_x1": 251.53, "r_y1": 300.83, "r_x2": 251.53, "r_y2": 294.89, "r_x3": 181.89, "r_y3": 294.89, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83, "r_y0": 194.82, "r_x1": 253.61, "r_y1": 194.82, "r_x2": 253.61, "r_y2": 184.76, "r_x3": 247.83, "r_y3": 184.76, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.19, "r_y0": 613.74, "r_x1": 381.55, "r_y1": 613.74, "r_x2": 381.55, "r_y2": 607.81, "r_x3": 292.19, "r_y3": 607.81, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 403.4, "r_x1": 180.19, "r_y1": 403.4, "r_x2": 180.19, "r_y2": 381.36, "r_x3": 172.28, "r_y3": 381.36, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 578.75, "r_x1": 180.19, "r_y1": 578.75, "r_x2": 180.19, "r_y2": 555.78, "r_x3": 172.28, "r_y3": 555.78, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 0, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "page_header", "bbox": { "l": 471.38, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.901, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.38, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 471.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "caption", "bbox": { "l": 134.76, "t": 125.8, "r": 480.59, "b": 177.77, "coord_origin": "TOPLEFT" }, "confidence": 0.866, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 133.73, "r_x1": 162.64, "r_y1": 133.73, "r_x2": 162.64, "r_y2": 125.8, "r_x3": 134.76, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.22, "r_y0": 133.93, "r_x1": 480.59, "r_y1": 133.93, "r_x2": 480.59, "r_y2": 125.86, "r_x3": 165.22, "r_y3": 125.86, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 144.89, "r_x1": 480.59, "r_y1": 144.89, "r_x2": 480.59, "r_y2": 136.82, "r_x3": 134.76, "r_y3": 136.82, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.85, "r_x1": 480.59, "r_y1": 155.85, "r_x2": 480.59, "r_y2": 147.78, "r_x3": 134.76, "r_y3": 147.78, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 166.81, "r_x1": 480.59, "r_y1": 166.81, "r_x2": 480.59, "r_y2": 158.74, "r_x3": 134.76, "r_y3": 158.74, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 177.77, "r_x1": 415.84, "r_y1": 177.77, "r_x2": 415.84, "r_y2": 169.7, "r_x3": 134.76, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "picture", "bbox": { "l": 168.39, "t": 181.97, "r": 447.35, "b": 634.01, "coord_origin": "TOPLEFT" }, "confidence": 0.761, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.36, "r_x1": 177.6, "r_y1": 320.36, "r_x2": 177.6, "r_y2": 312.45, "r_x3": 171.5, "r_y3": 312.45, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.06, "r_y0": 500.57, "r_x1": 177.15, "r_y1": 500.57, "r_x2": 177.15, "r_y2": 492.65, "r_x3": 171.06, "r_y3": 492.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 633.42, "r_x1": 374.96, "r_y1": 633.42, "r_x2": 374.96, "r_y2": 627.48, "r_x3": 283.05, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 623.29, "r_x1": 398.06, "r_y1": 623.29, "r_x2": 398.06, "r_y2": 617.36, "r_x3": 283.05, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64, "r_y0": 471.53, "r_x1": 437.51, "r_y1": 471.53, "r_x2": 437.51, "r_y2": 465.6, "r_x3": 293.64, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 294.29, "r_x1": 239.23, "r_y1": 294.29, "r_x2": 239.23, "r_y2": 288.36, "r_x3": 181.89, "r_y3": 288.36, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 300.83, "r_x1": 251.53, "r_y1": 300.83, "r_x2": 251.53, "r_y2": 294.89, "r_x3": 181.89, "r_y3": 294.89, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83, "r_y0": 194.82, "r_x1": 253.61, "r_y1": 194.82, "r_x2": 253.61, "r_y2": 184.76, "r_x3": 247.83, "r_y3": 184.76, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.19, "r_y0": 613.74, "r_x1": 381.55, "r_y1": 613.74, "r_x2": 381.55, "r_y2": 607.81, "r_x3": 292.19, "r_y3": 607.81, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 403.4, "r_x1": 180.19, "r_y1": 403.4, "r_x2": 180.19, "r_y2": 381.36, "r_x3": 172.28, "r_y3": 381.36, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 578.75, "r_x1": 180.19, "r_y1": 578.75, "r_x2": 180.19, "r_y2": 555.78, "r_x3": 172.28, "r_y3": 555.78, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 18, "label": "text", "bbox": { "l": 171.5, "t": 312.45, "r": 177.6, "b": 320.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.36, "r_x1": 177.6, "r_y1": 320.36, "r_x2": 177.6, "r_y2": 312.45, "r_x3": 171.5, "r_y3": 312.45, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 171.06, "t": 492.65, "r": 177.15, "b": 500.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.06, "r_y0": 500.57, "r_x1": 177.15, "r_y1": 500.57, "r_x2": 177.15, "r_y2": 492.65, "r_x3": 171.06, "r_y3": 492.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 283.05, "t": 627.48, "r": 374.96, "b": 633.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 633.42, "r_x1": 374.96, "r_y1": 633.42, "r_x2": 374.96, "r_y2": 627.48, "r_x3": 283.05, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 283.05, "t": 617.36, "r": 398.06, "b": 623.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 623.29, "r_x1": 398.06, "r_y1": 623.29, "r_x2": 398.06, "r_y2": 617.36, "r_x3": 283.05, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 293.64, "t": 465.6, "r": 437.51, "b": 471.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64, "r_y0": 471.53, "r_x1": 437.51, "r_y1": 471.53, "r_x2": 437.51, "r_y2": 465.6, "r_x3": 293.64, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 181.89, "t": 288.36, "r": 239.23, "b": 294.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 294.29, "r_x1": 239.23, "r_y1": 294.29, "r_x2": 239.23, "r_y2": 288.36, "r_x3": 181.89, "r_y3": 288.36, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 181.89, "t": 294.89, "r": 251.53, "b": 300.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 300.83, "r_x1": 251.53, "r_y1": 300.83, "r_x2": 251.53, "r_y2": 294.89, "r_x3": 181.89, "r_y3": 294.89, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 247.83, "t": 184.76, "r": 253.61, "b": 194.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83, "r_y0": 194.82, "r_x1": 253.61, "r_y1": 194.82, "r_x2": 253.61, "r_y2": 184.76, "r_x3": 247.83, "r_y3": 184.76, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 292.19, "t": 607.81, "r": 381.55, "b": 613.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.19, "r_y0": 613.74, "r_x1": 381.55, "r_y1": 613.74, "r_x2": 381.55, "r_y2": 607.81, "r_x3": 292.19, "r_y3": 607.81, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 172.28, "t": 381.36, "r": 180.19, "b": 403.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 403.4, "r_x1": 180.19, "r_y1": 403.4, "r_x2": 180.19, "r_y2": 381.36, "r_x3": 172.28, "r_y3": 381.36, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 172.28, "t": 555.78, "r": 180.19, "b": 578.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 578.75, "r_x1": 180.19, "r_y1": 578.75, "r_x2": 180.19, "r_y2": 555.78, "r_x3": 172.28, "r_y3": 555.78, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "page_header", "bbox": { "l": 471.38, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.901, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.38, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 471.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" }, { "label": "caption", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 134.76, "t": 125.8, "r": 480.59, "b": 177.77, "coord_origin": "TOPLEFT" }, "confidence": 0.866, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 133.73, "r_x1": 162.64, "r_y1": 133.73, "r_x2": 162.64, "r_y2": 125.8, "r_x3": 134.76, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.22, "r_y0": 133.93, "r_x1": 480.59, "r_y1": 133.93, "r_x2": 480.59, "r_y2": 125.86, "r_x3": 165.22, "r_y3": 125.86, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 144.89, "r_x1": 480.59, "r_y1": 144.89, "r_x2": 480.59, "r_y2": 136.82, "r_x3": 134.76, "r_y3": 136.82, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.85, "r_x1": 480.59, "r_y1": 155.85, "r_x2": 480.59, "r_y2": 147.78, "r_x3": 134.76, "r_y3": 147.78, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 166.81, "r_x1": 480.59, "r_y1": 166.81, "r_x2": 480.59, "r_y2": 158.74, "r_x3": 134.76, "r_y3": 158.74, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 177.77, "r_x1": 415.84, "r_y1": 177.77, "r_x2": 415.84, "r_y2": 169.7, "r_x3": 134.76, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 6. Visualization of predicted structure and detected bounding boxes on a complex table with many rows. The OTSL model (B) captured repeating pattern of horizontally merged cells from the GT (A), unlike the HTML model (C). The HTML model also didn't complete the HTML sequence correctly and displayed a lot more of drift and overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet." }, { "label": "picture", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "picture", "bbox": { "l": 168.39, "t": 181.97, "r": 447.35, "b": 634.01, "coord_origin": "TOPLEFT" }, "confidence": 0.761, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.36, "r_x1": 177.6, "r_y1": 320.36, "r_x2": 177.6, "r_y2": 312.45, "r_x3": 171.5, "r_y3": 312.45, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.06, "r_y0": 500.57, "r_x1": 177.15, "r_y1": 500.57, "r_x2": 177.15, "r_y2": 492.65, "r_x3": 171.06, "r_y3": 492.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 633.42, "r_x1": 374.96, "r_y1": 633.42, "r_x2": 374.96, "r_y2": 627.48, "r_x3": 283.05, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 623.29, "r_x1": 398.06, "r_y1": 623.29, "r_x2": 398.06, "r_y2": 617.36, "r_x3": 283.05, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64, "r_y0": 471.53, "r_x1": 437.51, "r_y1": 471.53, "r_x2": 437.51, "r_y2": 465.6, "r_x3": 293.64, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 294.29, "r_x1": 239.23, "r_y1": 294.29, "r_x2": 239.23, "r_y2": 288.36, "r_x3": 181.89, "r_y3": 288.36, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 300.83, "r_x1": 251.53, "r_y1": 300.83, "r_x2": 251.53, "r_y2": 294.89, "r_x3": 181.89, "r_y3": 294.89, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83, "r_y0": 194.82, "r_x1": 253.61, "r_y1": 194.82, "r_x2": 253.61, "r_y2": 184.76, "r_x3": 247.83, "r_y3": 184.76, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.19, "r_y0": 613.74, "r_x1": 381.55, "r_y1": 613.74, "r_x2": 381.55, "r_y2": 607.81, "r_x3": 292.19, "r_y3": 607.81, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 403.4, "r_x1": 180.19, "r_y1": 403.4, "r_x2": 180.19, "r_y2": 381.36, "r_x3": 172.28, "r_y3": 381.36, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 578.75, "r_x1": 180.19, "r_y1": 578.75, "r_x2": 180.19, "r_y2": 555.78, "r_x3": 172.28, "r_y3": 555.78, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 18, "label": "text", "bbox": { "l": 171.5, "t": 312.45, "r": 177.6, "b": 320.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.36, "r_x1": 177.6, "r_y1": 320.36, "r_x2": 177.6, "r_y2": 312.45, "r_x3": 171.5, "r_y3": 312.45, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 171.06, "t": 492.65, "r": 177.15, "b": 500.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.06, "r_y0": 500.57, "r_x1": 177.15, "r_y1": 500.57, "r_x2": 177.15, "r_y2": 492.65, "r_x3": 171.06, "r_y3": 492.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 283.05, "t": 627.48, "r": 374.96, "b": 633.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 633.42, "r_x1": 374.96, "r_y1": 633.42, "r_x2": 374.96, "r_y2": 627.48, "r_x3": 283.05, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 283.05, "t": 617.36, "r": 398.06, "b": 623.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 623.29, "r_x1": 398.06, "r_y1": 623.29, "r_x2": 398.06, "r_y2": 617.36, "r_x3": 283.05, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 293.64, "t": 465.6, "r": 437.51, "b": 471.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64, "r_y0": 471.53, "r_x1": 437.51, "r_y1": 471.53, "r_x2": 437.51, "r_y2": 465.6, "r_x3": 293.64, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 181.89, "t": 288.36, "r": 239.23, "b": 294.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 294.29, "r_x1": 239.23, "r_y1": 294.29, "r_x2": 239.23, "r_y2": 288.36, "r_x3": 181.89, "r_y3": 288.36, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 181.89, "t": 294.89, "r": 251.53, "b": 300.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 300.83, "r_x1": 251.53, "r_y1": 300.83, "r_x2": 251.53, "r_y2": 294.89, "r_x3": 181.89, "r_y3": 294.89, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 247.83, "t": 184.76, "r": 253.61, "b": 194.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83, "r_y0": 194.82, "r_x1": 253.61, "r_y1": 194.82, "r_x2": 253.61, "r_y2": 184.76, "r_x3": 247.83, "r_y3": 184.76, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 292.19, "t": 607.81, "r": 381.55, "b": 613.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.19, "r_y0": 613.74, "r_x1": 381.55, "r_y1": 613.74, "r_x2": 381.55, "r_y2": 607.81, "r_x3": 292.19, "r_y3": 607.81, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 172.28, "t": 381.36, "r": 180.19, "b": 403.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 403.4, "r_x1": 180.19, "r_y1": 403.4, "r_x2": 180.19, "r_y2": 381.36, "r_x3": 172.28, "r_y3": 381.36, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 172.28, "t": 555.78, "r": 180.19, "b": 578.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 578.75, "r_x1": 180.19, "r_y1": 578.75, "r_x2": 180.19, "r_y2": 555.78, "r_x3": 172.28, "r_y3": 555.78, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "body": [ { "label": "caption", "id": 2, "page_no": 10, "cluster": { "id": 2, "label": "caption", "bbox": { "l": 134.76, "t": 125.8, "r": 480.59, "b": 177.77, "coord_origin": "TOPLEFT" }, "confidence": 0.866, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 133.73, "r_x1": 162.64, "r_y1": 133.73, "r_x2": 162.64, "r_y2": 125.8, "r_x3": 134.76, "r_y3": 125.8, "coord_origin": "TOPLEFT" }, "text": "Fig. 6.", "orig": "Fig. 6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 165.22, "r_y0": 133.93, "r_x1": 480.59, "r_y1": 133.93, "r_x2": 480.59, "r_y2": 125.86, "r_x3": 165.22, "r_y3": 125.86, "coord_origin": "TOPLEFT" }, "text": "Visualization of predicted structure and detected bounding boxes on a complex", "orig": "Visualization of predicted structure and detected bounding boxes on a complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 144.89, "r_x1": 480.59, "r_y1": 144.89, "r_x2": 480.59, "r_y2": 136.82, "r_x3": 134.76, "r_y3": 136.82, "coord_origin": "TOPLEFT" }, "text": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "orig": "table with many rows. The OTSL model (B) captured repeating pattern of horizontally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.85, "r_x1": 480.59, "r_y1": 155.85, "r_x2": 480.59, "r_y2": 147.78, "r_x3": 134.76, "r_y3": 147.78, "coord_origin": "TOPLEFT" }, "text": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "orig": "merged cells from the GT (A), unlike the HTML model (C). The HTML model also", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 166.81, "r_x1": 480.59, "r_y1": 166.81, "r_x2": 480.59, "r_y2": 158.74, "r_x3": 134.76, "r_y3": 158.74, "coord_origin": "TOPLEFT" }, "text": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "orig": "didn\u2019t complete the HTML sequence correctly and displayed a lot more of drift and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 177.77, "r_x1": 415.84, "r_y1": 177.77, "r_x2": 415.84, "r_y2": 169.7, "r_x3": 134.76, "r_y3": 169.7, "coord_origin": "TOPLEFT" }, "text": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "orig": "overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Fig. 6. Visualization of predicted structure and detected bounding boxes on a complex table with many rows. The OTSL model (B) captured repeating pattern of horizontally merged cells from the GT (A), unlike the HTML model (C). The HTML model also didn't complete the HTML sequence correctly and displayed a lot more of drift and overlap of bounding boxes. \"PMC5406406_003_01.png\" PubTabNet." }, { "label": "picture", "id": 3, "page_no": 10, "cluster": { "id": 3, "label": "picture", "bbox": { "l": 168.39, "t": 181.97, "r": 447.35, "b": 634.01, "coord_origin": "TOPLEFT" }, "confidence": 0.761, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.36, "r_x1": 177.6, "r_y1": 320.36, "r_x2": 177.6, "r_y2": 312.45, "r_x3": 171.5, "r_y3": 312.45, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.06, "r_y0": 500.57, "r_x1": 177.15, "r_y1": 500.57, "r_x2": 177.15, "r_y2": 492.65, "r_x3": 171.06, "r_y3": 492.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 633.42, "r_x1": 374.96, "r_y1": 633.42, "r_x2": 374.96, "r_y2": 627.48, "r_x3": 283.05, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 623.29, "r_x1": 398.06, "r_y1": 623.29, "r_x2": 398.06, "r_y2": 617.36, "r_x3": 283.05, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64, "r_y0": 471.53, "r_x1": 437.51, "r_y1": 471.53, "r_x2": 437.51, "r_y2": 465.6, "r_x3": 293.64, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 294.29, "r_x1": 239.23, "r_y1": 294.29, "r_x2": 239.23, "r_y2": 288.36, "r_x3": 181.89, "r_y3": 288.36, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 300.83, "r_x1": 251.53, "r_y1": 300.83, "r_x2": 251.53, "r_y2": 294.89, "r_x3": 181.89, "r_y3": 294.89, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83, "r_y0": 194.82, "r_x1": 253.61, "r_y1": 194.82, "r_x2": 253.61, "r_y2": 184.76, "r_x3": 247.83, "r_y3": 184.76, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.19, "r_y0": 613.74, "r_x1": 381.55, "r_y1": 613.74, "r_x2": 381.55, "r_y2": 607.81, "r_x3": 292.19, "r_y3": 607.81, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 403.4, "r_x1": 180.19, "r_y1": 403.4, "r_x2": 180.19, "r_y2": 381.36, "r_x3": 172.28, "r_y3": 381.36, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 578.75, "r_x1": 180.19, "r_y1": 578.75, "r_x2": 180.19, "r_y2": 555.78, "r_x3": 172.28, "r_y3": 555.78, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [ { "id": 18, "label": "text", "bbox": { "l": 171.5, "t": 312.45, "r": 177.6, "b": 320.36, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.5, "r_y0": 320.36, "r_x1": 177.6, "r_y1": 320.36, "r_x2": 177.6, "r_y2": 312.45, "r_x3": 171.5, "r_y3": 312.45, "coord_origin": "TOPLEFT" }, "text": "B", "orig": "B", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 19, "label": "text", "bbox": { "l": 171.06, "t": 492.65, "r": 177.15, "b": 500.57, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 171.06, "r_y0": 500.57, "r_x1": 177.15, "r_y1": 500.57, "r_x2": 177.15, "r_y2": 492.65, "r_x3": 171.06, "r_y3": 492.65, "coord_origin": "TOPLEFT" }, "text": "C", "orig": "C", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 20, "label": "text", "bbox": { "l": 283.05, "t": 627.48, "r": 374.96, "b": 633.42, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 633.42, "r_x1": 374.96, "r_y1": 633.42, "r_x2": 374.96, "r_y2": 627.48, "r_x3": 283.05, "r_y3": 627.48, "coord_origin": "TOPLEFT" }, "text": "Incorrect end of HTML sequence", "orig": "Incorrect end of HTML sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 21, "label": "text", "bbox": { "l": 283.05, "t": 617.36, "r": 398.06, "b": 623.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 283.05, "r_y0": 623.29, "r_x1": 398.06, "r_y1": 623.29, "r_x2": 398.06, "r_y2": 617.36, "r_x3": 283.05, "r_y3": 617.36, "coord_origin": "TOPLEFT" }, "text": "Horizontally merged cells are not present", "orig": "Horizontally merged cells are not present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 22, "label": "text", "bbox": { "l": 293.64, "t": 465.6, "r": 437.51, "b": 471.53, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 293.64, "r_y0": 471.53, "r_x1": 437.51, "r_y1": 471.53, "r_x2": 437.51, "r_y2": 465.6, "r_x3": 293.64, "r_y3": 465.6, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern is well represented in predictions", "orig": "Repeating pattern is well represented in predictions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 23, "label": "text", "bbox": { "l": 181.89, "t": 288.36, "r": 239.23, "b": 294.29, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 294.29, "r_x1": 239.23, "r_y1": 294.29, "r_x2": 239.23, "r_y2": 288.36, "r_x3": 181.89, "r_y3": 288.36, "coord_origin": "TOPLEFT" }, "text": "Repeating pattern of", "orig": "Repeating pattern of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 24, "label": "text", "bbox": { "l": 181.89, "t": 294.89, "r": 251.53, "b": 300.83, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 181.89, "r_y0": 300.83, "r_x1": 251.53, "r_y1": 300.83, "r_x2": 251.53, "r_y2": 294.89, "r_x3": 181.89, "r_y3": 294.89, "coord_origin": "TOPLEFT" }, "text": "horizontally merged cells", "orig": "horizontally merged cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 25, "label": "text", "bbox": { "l": 247.83, "t": 184.76, "r": 253.61, "b": 194.82, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 247.83, "r_y0": 194.82, "r_x1": 253.61, "r_y1": 194.82, "r_x2": 253.61, "r_y2": 184.76, "r_x3": 247.83, "r_y3": 184.76, "coord_origin": "TOPLEFT" }, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 26, "label": "text", "bbox": { "l": 292.19, "t": 607.81, "r": 381.55, "b": 613.74, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 292.19, "r_y0": 613.74, "r_x1": 381.55, "r_y1": 613.74, "r_x2": 381.55, "r_y2": 607.81, "r_x3": 292.19, "r_y3": 607.81, "coord_origin": "TOPLEFT" }, "text": "Bounding box drifting at the end", "orig": "Bounding box drifting at the end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 27, "label": "text", "bbox": { "l": 172.28, "t": 381.36, "r": 180.19, "b": 403.4, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 403.4, "r_x1": 180.19, "r_y1": 403.4, "r_x2": 180.19, "r_y2": 381.36, "r_x3": 172.28, "r_y3": 381.36, "coord_origin": "TOPLEFT" }, "text": "OTSL", "orig": "OTSL", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 28, "label": "text", "bbox": { "l": 172.28, "t": 555.78, "r": 180.19, "b": 578.75, "coord_origin": "TOPLEFT" }, "confidence": 1.0, "cells": [ { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 172.28, "r_y0": 578.75, "r_x1": 180.19, "r_y1": 578.75, "r_x2": 180.19, "r_y2": 555.78, "r_x3": 172.28, "r_y3": 555.78, "coord_origin": "TOPLEFT" }, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null } ], "headers": [ { "label": "page_header", "id": 0, "page_no": 10, "cluster": { "id": 0, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.93, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 1, "page_no": 10, "cluster": { "id": 1, "label": "page_header", "bbox": { "l": 471.38, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.901, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.38, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 471.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11" } ] } }, { "page_no": 11, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 128.12, "r_x1": 141.49, "r_y1": 128.12, "r_x2": 141.49, "r_y2": 117.55, "r_x3": 134.76, "r_y3": 117.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 128.12, "r_x1": 219.25, "r_y1": 128.12, "r_x2": 219.25, "r_y2": 117.55, "r_x3": 154.94, "r_y3": 117.55, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.66, "r_x1": 480.59, "r_y1": 155.66, "r_x2": 480.59, "r_y2": 146.86, "r_x3": 134.76, "r_y3": 146.86, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 167.62, "r_x1": 480.59, "r_y1": 167.62, "r_x2": 480.59, "r_y2": 158.82, "r_x3": 134.76, "r_y3": 158.82, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 179.57, "r_x1": 480.59, "r_y1": 179.57, "r_x2": 480.59, "r_y2": 170.77, "r_x3": 134.76, "r_y3": 170.77, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 191.53, "r_x1": 480.6, "r_y1": 191.53, "r_x2": 480.6, "r_y2": 182.73, "r_x3": 134.76, "r_y3": 182.73, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 203.48, "r_x1": 239.54, "r_y1": 203.48, "r_x2": 239.54, "r_y2": 194.68, "r_x3": 134.76, "r_y3": 194.68, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 216.24, "r_x1": 480.59, "r_y1": 216.24, "r_x2": 480.59, "r_y2": 207.44, "r_x3": 149.71, "r_y3": 207.44, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 228.2, "r_x1": 480.59, "r_y1": 228.2, "r_x2": 480.59, "r_y2": 219.4, "r_x3": 134.76, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 240.15, "r_x1": 480.59, "r_y1": 240.15, "r_x2": 480.59, "r_y2": 231.35, "r_x3": 134.76, "r_y3": 231.35, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 252.11, "r_x1": 480.59, "r_y1": 252.11, "r_x2": 480.59, "r_y2": 243.31, "r_x3": 134.76, "r_y3": 243.31, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 264.06, "r_x1": 480.59, "r_y1": 264.06, "r_x2": 480.59, "r_y2": 255.26, "r_x3": 134.76, "r_y3": 255.26, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 276.02, "r_x1": 480.59, "r_y1": 276.02, "r_x2": 480.59, "r_y2": 267.22, "r_x3": 134.76, "r_y3": 267.22, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 287.97, "r_x1": 480.59, "r_y1": 287.97, "r_x2": 480.59, "r_y2": 279.17, "r_x3": 134.76, "r_y3": 279.17, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 299.93, "r_x1": 480.59, "r_y1": 299.93, "r_x2": 480.59, "r_y2": 291.13, "r_x3": 134.76, "r_y3": 291.13, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 311.88, "r_x1": 480.59, "r_y1": 311.88, "r_x2": 480.59, "r_y2": 303.08, "r_x3": 134.76, "r_y3": 303.08, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 323.84, "r_x1": 240.92, "r_y1": 323.84, "r_x2": 240.92, "r_y2": 315.04, "r_x3": 134.76, "r_y3": 315.04, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 336.6, "r_x1": 480.59, "r_y1": 336.6, "r_x2": 480.59, "r_y2": 327.8, "r_x3": 149.71, "r_y3": 327.8, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 348.55, "r_x1": 480.59, "r_y1": 348.55, "r_x2": 480.59, "r_y2": 339.75, "r_x3": 134.76, "r_y3": 339.75, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 360.51, "r_x1": 480.59, "r_y1": 360.51, "r_x2": 480.59, "r_y2": 351.71, "r_x3": 134.76, "r_y3": 351.71, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 372.46, "r_x1": 480.59, "r_y1": 372.46, "r_x2": 480.59, "r_y2": 363.66, "r_x3": 134.76, "r_y3": 363.66, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 384.42, "r_x1": 480.59, "r_y1": 384.42, "r_x2": 480.59, "r_y2": 375.62, "r_x3": 134.76, "r_y3": 375.62, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 396.37, "r_x1": 480.59, "r_y1": 396.37, "r_x2": 480.59, "r_y2": 387.57, "r_x3": 134.76, "r_y3": 387.57, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 408.33, "r_x1": 480.59, "r_y1": 408.33, "r_x2": 480.59, "r_y2": 399.53, "r_x3": 134.76, "r_y3": 399.53, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 420.28, "r_x1": 480.59, "r_y1": 420.28, "r_x2": 480.59, "r_y2": 411.49, "r_x3": 134.76, "r_y3": 411.49, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 432.24, "r_x1": 480.59, "r_y1": 432.24, "r_x2": 480.59, "r_y2": 423.44, "r_x3": 134.76, "r_y3": 423.44, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 444.19, "r_x1": 480.59, "r_y1": 444.19, "r_x2": 480.59, "r_y2": 435.4, "r_x3": 134.76, "r_y3": 435.4, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 456.15, "r_x1": 480.59, "r_y1": 456.15, "r_x2": 480.59, "r_y2": 447.35, "r_x3": 134.76, "r_y3": 447.35, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 468.1, "r_x1": 366.78, "r_y1": 468.1, "r_x2": 366.78, "r_y2": 459.31, "r_x3": 134.76, "r_y3": 459.31, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 504.39, "r_x1": 197.69, "r_y1": 504.39, "r_x2": 197.69, "r_y2": 493.82, "r_x3": 134.76, "r_y3": 493.82, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 530.95, "r_x1": 146.46, "r_y1": 530.95, "r_x2": 146.46, "r_y2": 522.88, "r_x3": 139.37, "r_y3": 522.88, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.02, "r_y0": 530.95, "r_x1": 480.59, "r_y1": 530.95, "r_x2": 480.59, "r_y2": 522.88, "r_x3": 151.02, "r_y3": 522.88, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 541.91, "r_x1": 480.59, "r_y1": 541.91, "r_x2": 480.59, "r_y2": 533.84, "r_x3": 151.52, "r_y3": 533.84, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 552.87, "r_x1": 176.34, "r_y1": 552.87, "r_x2": 176.34, "r_y2": 544.8, "r_x3": 151.52, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.46, "r_y0": 552.66, "r_x1": 250.68, "r_y1": 552.66, "r_x2": 250.68, "r_y2": 544.74, "r_x3": 179.46, "r_y3": 544.74, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.8, "r_y0": 552.87, "r_x1": 281.96, "r_y1": 552.87, "r_x2": 281.96, "r_y2": 544.8, "r_x3": 253.8, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.08, "r_y0": 552.91, "r_x1": 478.03, "r_y1": 552.91, "r_x2": 478.03, "r_y2": 545.44, "r_x3": 285.08, "r_y3": 545.44, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.03, "r_y0": 552.87, "r_x1": 480.59, "r_y1": 552.87, "r_x2": 480.59, "r_y2": 544.8, "r_x3": 478.03, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 563.87, "r_x1": 344.47, "r_y1": 563.87, "r_x2": 344.47, "r_y2": 556.4, "r_x3": 151.52, "r_y3": 556.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 575.59, "r_x1": 145.94, "r_y1": 575.59, "r_x2": 145.94, "r_y2": 567.52, "r_x3": 139.37, "r_y3": 567.52, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.17, "r_y0": 575.59, "r_x1": 480.59, "r_y1": 575.59, "r_x2": 480.59, "r_y2": 567.52, "r_x3": 150.17, "r_y3": 567.52, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 586.55, "r_x1": 480.59, "r_y1": 586.55, "r_x2": 480.59, "r_y2": 578.48, "r_x3": 151.52, "r_y3": 578.48, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 597.51, "r_x1": 480.59, "r_y1": 597.51, "r_x2": 480.59, "r_y2": 589.44, "r_x3": 151.52, "r_y3": 589.44, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 608.47, "r_x1": 364.18, "r_y1": 608.47, "r_x2": 364.18, "r_y2": 600.4, "r_x3": 151.52, "r_y3": 600.4, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 620.23, "r_x1": 146.44, "r_y1": 620.23, "r_x2": 146.44, "r_y2": 612.16, "r_x3": 139.37, "r_y3": 612.16, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.98, "r_y0": 620.23, "r_x1": 480.59, "r_y1": 620.23, "r_x2": 480.59, "r_y2": 612.16, "r_x3": 150.98, "r_y3": 612.16, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 631.19, "r_x1": 400.23, "r_y1": 631.19, "r_x2": 400.23, "r_y2": 623.12, "r_x3": 151.52, "r_y3": 623.12, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 642.95, "r_x1": 146.52, "r_y1": 642.95, "r_x2": 146.52, "r_y2": 634.88, "r_x3": 139.37, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.12, "r_y0": 642.95, "r_x1": 480.59, "r_y1": 642.95, "r_x2": 480.59, "r_y2": 634.88, "r_x3": 151.12, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 653.91, "r_x1": 480.59, "r_y1": 653.91, "r_x2": 480.59, "r_y2": 645.84, "r_x3": 151.52, "r_y3": 645.84, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 664.87, "r_x1": 350.11, "r_y1": 664.87, "r_x2": 350.11, "r_y2": 656.8, "r_x3": 151.52, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 10, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 143.98, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.861, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "page_header", "bbox": { "l": 167.82, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.893, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "section_header", "bbox": { "l": 134.76, "t": 117.55, "r": 219.25, "b": 128.12, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 128.12, "r_x1": 141.49, "r_y1": 128.12, "r_x2": 141.49, "r_y2": 117.55, "r_x3": 134.76, "r_y3": 117.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 128.12, "r_x1": 219.25, "r_y1": 128.12, "r_x2": 219.25, "r_y2": 117.55, "r_x3": 154.94, "r_y3": 117.55, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 146.86, "r": 480.6, "b": 203.48, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.66, "r_x1": 480.59, "r_y1": 155.66, "r_x2": 480.59, "r_y2": 146.86, "r_x3": 134.76, "r_y3": 146.86, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 167.62, "r_x1": 480.59, "r_y1": 167.62, "r_x2": 480.59, "r_y2": 158.82, "r_x3": 134.76, "r_y3": 158.82, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 179.57, "r_x1": 480.59, "r_y1": 179.57, "r_x2": 480.59, "r_y2": 170.77, "r_x3": 134.76, "r_y3": 170.77, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 191.53, "r_x1": 480.6, "r_y1": 191.53, "r_x2": 480.6, "r_y2": 182.73, "r_x3": 134.76, "r_y3": 182.73, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 203.48, "r_x1": 239.54, "r_y1": 203.48, "r_x2": 239.54, "r_y2": 194.68, "r_x3": 134.76, "r_y3": 194.68, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 207.44, "r": 480.59, "b": 323.84, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 216.24, "r_x1": 480.59, "r_y1": 216.24, "r_x2": 480.59, "r_y2": 207.44, "r_x3": 149.71, "r_y3": 207.44, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 228.2, "r_x1": 480.59, "r_y1": 228.2, "r_x2": 480.59, "r_y2": 219.4, "r_x3": 134.76, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 240.15, "r_x1": 480.59, "r_y1": 240.15, "r_x2": 480.59, "r_y2": 231.35, "r_x3": 134.76, "r_y3": 231.35, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 252.11, "r_x1": 480.59, "r_y1": 252.11, "r_x2": 480.59, "r_y2": 243.31, "r_x3": 134.76, "r_y3": 243.31, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 264.06, "r_x1": 480.59, "r_y1": 264.06, "r_x2": 480.59, "r_y2": 255.26, "r_x3": 134.76, "r_y3": 255.26, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 276.02, "r_x1": 480.59, "r_y1": 276.02, "r_x2": 480.59, "r_y2": 267.22, "r_x3": 134.76, "r_y3": 267.22, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 287.97, "r_x1": 480.59, "r_y1": 287.97, "r_x2": 480.59, "r_y2": 279.17, "r_x3": 134.76, "r_y3": 279.17, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 299.93, "r_x1": 480.59, "r_y1": 299.93, "r_x2": 480.59, "r_y2": 291.13, "r_x3": 134.76, "r_y3": 291.13, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 311.88, "r_x1": 480.59, "r_y1": 311.88, "r_x2": 480.59, "r_y2": 303.08, "r_x3": 134.76, "r_y3": 303.08, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 323.84, "r_x1": 240.92, "r_y1": 323.84, "r_x2": 240.92, "r_y2": 315.04, "r_x3": 134.76, "r_y3": 315.04, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 327.8, "r": 480.59, "b": 468.1, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 336.6, "r_x1": 480.59, "r_y1": 336.6, "r_x2": 480.59, "r_y2": 327.8, "r_x3": 149.71, "r_y3": 327.8, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 348.55, "r_x1": 480.59, "r_y1": 348.55, "r_x2": 480.59, "r_y2": 339.75, "r_x3": 134.76, "r_y3": 339.75, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 360.51, "r_x1": 480.59, "r_y1": 360.51, "r_x2": 480.59, "r_y2": 351.71, "r_x3": 134.76, "r_y3": 351.71, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 372.46, "r_x1": 480.59, "r_y1": 372.46, "r_x2": 480.59, "r_y2": 363.66, "r_x3": 134.76, "r_y3": 363.66, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 384.42, "r_x1": 480.59, "r_y1": 384.42, "r_x2": 480.59, "r_y2": 375.62, "r_x3": 134.76, "r_y3": 375.62, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 396.37, "r_x1": 480.59, "r_y1": 396.37, "r_x2": 480.59, "r_y2": 387.57, "r_x3": 134.76, "r_y3": 387.57, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 408.33, "r_x1": 480.59, "r_y1": 408.33, "r_x2": 480.59, "r_y2": 399.53, "r_x3": 134.76, "r_y3": 399.53, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 420.28, "r_x1": 480.59, "r_y1": 420.28, "r_x2": 480.59, "r_y2": 411.49, "r_x3": 134.76, "r_y3": 411.49, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 432.24, "r_x1": 480.59, "r_y1": 432.24, "r_x2": 480.59, "r_y2": 423.44, "r_x3": 134.76, "r_y3": 423.44, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 444.19, "r_x1": 480.59, "r_y1": 444.19, "r_x2": 480.59, "r_y2": 435.4, "r_x3": 134.76, "r_y3": 435.4, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 456.15, "r_x1": 480.59, "r_y1": 456.15, "r_x2": 480.59, "r_y2": 447.35, "r_x3": 134.76, "r_y3": 447.35, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 468.1, "r_x1": 366.78, "r_y1": 468.1, "r_x2": 366.78, "r_y2": 459.31, "r_x3": 134.76, "r_y3": 459.31, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "section_header", "bbox": { "l": 134.76, "t": 493.82, "r": 197.69, "b": 504.39, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 504.39, "r_x1": 197.69, "r_y1": 504.39, "r_x2": 197.69, "r_y2": 493.82, "r_x3": 134.76, "r_y3": 493.82, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 139.37, "t": 522.88, "r": 480.59, "b": 563.87, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 530.95, "r_x1": 146.46, "r_y1": 530.95, "r_x2": 146.46, "r_y2": 522.88, "r_x3": 139.37, "r_y3": 522.88, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.02, "r_y0": 530.95, "r_x1": 480.59, "r_y1": 530.95, "r_x2": 480.59, "r_y2": 522.88, "r_x3": 151.02, "r_y3": 522.88, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 541.91, "r_x1": 480.59, "r_y1": 541.91, "r_x2": 480.59, "r_y2": 533.84, "r_x3": 151.52, "r_y3": 533.84, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 552.87, "r_x1": 176.34, "r_y1": 552.87, "r_x2": 176.34, "r_y2": 544.8, "r_x3": 151.52, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.46, "r_y0": 552.66, "r_x1": 250.68, "r_y1": 552.66, "r_x2": 250.68, "r_y2": 544.74, "r_x3": 179.46, "r_y3": 544.74, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.8, "r_y0": 552.87, "r_x1": 281.96, "r_y1": 552.87, "r_x2": 281.96, "r_y2": 544.8, "r_x3": 253.8, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.08, "r_y0": 552.91, "r_x1": 478.03, "r_y1": 552.91, "r_x2": 478.03, "r_y2": 545.44, "r_x3": 285.08, "r_y3": 545.44, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.03, "r_y0": 552.87, "r_x1": 480.59, "r_y1": 552.87, "r_x2": 480.59, "r_y2": 544.8, "r_x3": 478.03, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 563.87, "r_x1": 344.47, "r_y1": 563.87, "r_x2": 344.47, "r_y2": 556.4, "r_x3": 151.52, "r_y3": 556.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 139.37, "t": 567.52, "r": 480.59, "b": 608.47, "coord_origin": "TOPLEFT" }, "confidence": 0.973, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 575.59, "r_x1": 145.94, "r_y1": 575.59, "r_x2": 145.94, "r_y2": 567.52, "r_x3": 139.37, "r_y3": 567.52, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.17, "r_y0": 575.59, "r_x1": 480.59, "r_y1": 575.59, "r_x2": 480.59, "r_y2": 567.52, "r_x3": 150.17, "r_y3": 567.52, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 586.55, "r_x1": 480.59, "r_y1": 586.55, "r_x2": 480.59, "r_y2": 578.48, "r_x3": 151.52, "r_y3": 578.48, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 597.51, "r_x1": 480.59, "r_y1": 597.51, "r_x2": 480.59, "r_y2": 589.44, "r_x3": 151.52, "r_y3": 589.44, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 608.47, "r_x1": 364.18, "r_y1": 608.47, "r_x2": 364.18, "r_y2": 600.4, "r_x3": 151.52, "r_y3": 600.4, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 139.37, "t": 612.16, "r": 480.59, "b": 631.19, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 620.23, "r_x1": 146.44, "r_y1": 620.23, "r_x2": 146.44, "r_y2": 612.16, "r_x3": 139.37, "r_y3": 612.16, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.98, "r_y0": 620.23, "r_x1": 480.59, "r_y1": 620.23, "r_x2": 480.59, "r_y2": 612.16, "r_x3": 150.98, "r_y3": 612.16, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 631.19, "r_x1": 400.23, "r_y1": 631.19, "r_x2": 400.23, "r_y2": 623.12, "r_x3": 151.52, "r_y3": 623.12, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 139.37, "t": 634.88, "r": 480.59, "b": 664.87, "coord_origin": "TOPLEFT" }, "confidence": 0.975, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 642.95, "r_x1": 146.52, "r_y1": 642.95, "r_x2": 146.52, "r_y2": 634.88, "r_x3": 139.37, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.12, "r_y0": 642.95, "r_x1": 480.59, "r_y1": 642.95, "r_x2": 480.59, "r_y2": 634.88, "r_x3": 151.12, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 653.91, "r_x1": 480.59, "r_y1": 653.91, "r_x2": 480.59, "r_y2": 645.84, "r_x3": 151.52, "r_y3": 645.84, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 664.87, "r_x1": 350.11, "r_y1": 664.87, "r_x2": 350.11, "r_y2": 656.8, "r_x3": 151.52, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 143.98, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.861, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" }, { "label": "page_header", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 167.82, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.893, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "section_header", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 134.76, "t": 117.55, "r": 219.25, "b": 128.12, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 128.12, "r_x1": 141.49, "r_y1": 128.12, "r_x2": 141.49, "r_y2": 117.55, "r_x3": 134.76, "r_y3": 117.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 128.12, "r_x1": 219.25, "r_y1": 128.12, "r_x2": 219.25, "r_y2": 117.55, "r_x3": 154.94, "r_y3": 117.55, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6 Conclusion" }, { "label": "text", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 146.86, "r": 480.6, "b": 203.48, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.66, "r_x1": 480.59, "r_y1": 155.66, "r_x2": 480.59, "r_y2": 146.86, "r_x3": 134.76, "r_y3": 146.86, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 167.62, "r_x1": 480.59, "r_y1": 167.62, "r_x2": 480.59, "r_y2": 158.82, "r_x3": 134.76, "r_y3": 158.82, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 179.57, "r_x1": 480.59, "r_y1": 179.57, "r_x2": 480.59, "r_y2": 170.77, "r_x3": 134.76, "r_y3": 170.77, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 191.53, "r_x1": 480.6, "r_y1": 191.53, "r_x2": 480.6, "r_y2": 182.73, "r_x3": 134.76, "r_y3": 182.73, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 203.48, "r_x1": 239.54, "r_y1": 203.48, "r_x2": 239.54, "r_y2": 194.68, "r_x3": 134.76, "r_y3": 194.68, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We demonstrated that representing tables in HTML for the task of table structure recognition with Im2Seq models is ill-suited and has serious limitations. Furthermore, we presented in this paper an Optimized Table Structure Language (OTSL) which, when compared to commonly used general purpose languages, has several key benefits." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 207.44, "r": 480.59, "b": 323.84, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 216.24, "r_x1": 480.59, "r_y1": 216.24, "r_x2": 480.59, "r_y2": 207.44, "r_x3": 149.71, "r_y3": 207.44, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 228.2, "r_x1": 480.59, "r_y1": 228.2, "r_x2": 480.59, "r_y2": 219.4, "r_x3": 134.76, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 240.15, "r_x1": 480.59, "r_y1": 240.15, "r_x2": 480.59, "r_y2": 231.35, "r_x3": 134.76, "r_y3": 231.35, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 252.11, "r_x1": 480.59, "r_y1": 252.11, "r_x2": 480.59, "r_y2": 243.31, "r_x3": 134.76, "r_y3": 243.31, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 264.06, "r_x1": 480.59, "r_y1": 264.06, "r_x2": 480.59, "r_y2": 255.26, "r_x3": 134.76, "r_y3": 255.26, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 276.02, "r_x1": 480.59, "r_y1": 276.02, "r_x2": 480.59, "r_y2": 267.22, "r_x3": 134.76, "r_y3": 267.22, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 287.97, "r_x1": 480.59, "r_y1": 287.97, "r_x2": 480.59, "r_y2": 279.17, "r_x3": 134.76, "r_y3": 279.17, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 299.93, "r_x1": 480.59, "r_y1": 299.93, "r_x2": 480.59, "r_y2": 291.13, "r_x3": 134.76, "r_y3": 291.13, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 311.88, "r_x1": 480.59, "r_y1": 311.88, "r_x2": 480.59, "r_y2": 303.08, "r_x3": 134.76, "r_y3": 303.08, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 323.84, "r_x1": 240.92, "r_y1": 323.84, "r_x2": 240.92, "r_y2": 315.04, "r_x3": 134.76, "r_y3": 315.04, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "First and foremost, given the same network configuration, inference time for a table-structure prediction is about 2 times faster compared to the conventional HTML approach. This is primarily owed to the shorter sequence length of the OTSL representation. Additional performance benefits can be obtained with HPO (hyper parameter optimization). As we demonstrate in our experiments, models trained on OTSL can be significantly smaller, e.g. by reducing the number of encoder and decoder layers, while preserving comparatively good prediction quality. This can further improve inference performance, yielding 5-6 times faster inference speed in OTSL with prediction quality comparable to models trained on HTML (see Table 1)." }, { "label": "text", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 327.8, "r": 480.59, "b": 468.1, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 336.6, "r_x1": 480.59, "r_y1": 336.6, "r_x2": 480.59, "r_y2": 327.8, "r_x3": 149.71, "r_y3": 327.8, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 348.55, "r_x1": 480.59, "r_y1": 348.55, "r_x2": 480.59, "r_y2": 339.75, "r_x3": 134.76, "r_y3": 339.75, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 360.51, "r_x1": 480.59, "r_y1": 360.51, "r_x2": 480.59, "r_y2": 351.71, "r_x3": 134.76, "r_y3": 351.71, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 372.46, "r_x1": 480.59, "r_y1": 372.46, "r_x2": 480.59, "r_y2": 363.66, "r_x3": 134.76, "r_y3": 363.66, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 384.42, "r_x1": 480.59, "r_y1": 384.42, "r_x2": 480.59, "r_y2": 375.62, "r_x3": 134.76, "r_y3": 375.62, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 396.37, "r_x1": 480.59, "r_y1": 396.37, "r_x2": 480.59, "r_y2": 387.57, "r_x3": 134.76, "r_y3": 387.57, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 408.33, "r_x1": 480.59, "r_y1": 408.33, "r_x2": 480.59, "r_y2": 399.53, "r_x3": 134.76, "r_y3": 399.53, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 420.28, "r_x1": 480.59, "r_y1": 420.28, "r_x2": 480.59, "r_y2": 411.49, "r_x3": 134.76, "r_y3": 411.49, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 432.24, "r_x1": 480.59, "r_y1": 432.24, "r_x2": 480.59, "r_y2": 423.44, "r_x3": 134.76, "r_y3": 423.44, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 444.19, "r_x1": 480.59, "r_y1": 444.19, "r_x2": 480.59, "r_y2": 435.4, "r_x3": 134.76, "r_y3": 435.4, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 456.15, "r_x1": 480.59, "r_y1": 456.15, "r_x2": 480.59, "r_y2": 447.35, "r_x3": 134.76, "r_y3": 447.35, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 468.1, "r_x1": 366.78, "r_y1": 468.1, "r_x2": 366.78, "r_y2": 459.31, "r_x3": 134.76, "r_y3": 459.31, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vocabulary size. This allows autoregressive models to perform better in the TED metric, but especially with regards to prediction accuracy of the table-cell bounding boxes (see Table 2). As shown in Figure 5, we observe that the OTSL drastically reduces the drift for table cell bounding boxes at high row count and in sparse tables. This leads to more accurate predictions and a significant reduction in post-processing complexity, which is an undesired necessity in HTML-based Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few, simple and always backwards looking. Each new token can be validated only by analyzing the sequence of previous tokens, without requiring the entire sequence to detect mistakes. This in return allows to perform structural error detection and correction on-the-fly during sequence generation." }, { "label": "section_header", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "section_header", "bbox": { "l": 134.76, "t": 493.82, "r": 197.69, "b": 504.39, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 504.39, "r_x1": 197.69, "r_y1": 504.39, "r_x2": 197.69, "r_y2": 493.82, "r_x3": 134.76, "r_y3": 493.82, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.37, "t": 522.88, "r": 480.59, "b": 563.87, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 530.95, "r_x1": 146.46, "r_y1": 530.95, "r_x2": 146.46, "r_y2": 522.88, "r_x3": 139.37, "r_y3": 522.88, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.02, "r_y0": 530.95, "r_x1": 480.59, "r_y1": 530.95, "r_x2": 480.59, "r_y2": 522.88, "r_x3": 151.02, "r_y3": 522.88, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 541.91, "r_x1": 480.59, "r_y1": 541.91, "r_x2": 480.59, "r_y2": 533.84, "r_x3": 151.52, "r_y3": 533.84, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 552.87, "r_x1": 176.34, "r_y1": 552.87, "r_x2": 176.34, "r_y2": 544.8, "r_x3": 151.52, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.46, "r_y0": 552.66, "r_x1": 250.68, "r_y1": 552.66, "r_x2": 250.68, "r_y2": 544.74, "r_x3": 179.46, "r_y3": 544.74, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.8, "r_y0": 552.87, "r_x1": 281.96, "r_y1": 552.87, "r_x2": 281.96, "r_y2": 544.8, "r_x3": 253.8, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.08, "r_y0": 552.91, "r_x1": 478.03, "r_y1": 552.91, "r_x2": 478.03, "r_y2": 545.44, "r_x3": 285.08, "r_y3": 545.44, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.03, "r_y0": 552.87, "r_x1": 480.59, "r_y1": 552.87, "r_x2": 480.59, "r_y2": 544.8, "r_x3": 478.03, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 563.87, "r_x1": 344.47, "r_y1": 563.87, "r_x2": 344.47, "r_y2": 556.4, "r_x3": 151.52, "r_y3": 556.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering document conversion as a cloud service with high throughput and responsiveness. CoRR abs/2206.00785 (2022). https://doi.org/10.48550/arXiv.2206.00785 , https://doi.org/10.48550/arXiv.2206.00785" }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.37, "t": 567.52, "r": 480.59, "b": 608.47, "coord_origin": "TOPLEFT" }, "confidence": 0.973, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 575.59, "r_x1": 145.94, "r_y1": 575.59, "r_x2": 145.94, "r_y2": 567.52, "r_x3": 139.37, "r_y3": 567.52, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.17, "r_y0": 575.59, "r_x1": 480.59, "r_y1": 575.59, "r_x2": 480.59, "r_y2": 567.52, "r_x3": 150.17, "r_y3": 567.52, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 586.55, "r_x1": 480.59, "r_y1": 586.55, "r_x2": 480.59, "r_y2": 578.48, "r_x3": 151.52, "r_y3": 578.48, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 597.51, "r_x1": 480.59, "r_y1": 597.51, "r_x2": 480.59, "r_y2": 589.44, "r_x3": 151.52, "r_y3": 589.44, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 608.47, "r_x1": 364.18, "r_y1": 608.47, "r_x2": 364.18, "r_y2": 600.4, "r_x3": 151.52, "r_y3": 600.4, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition in the wild using transformer and identity matrix-based augmentation. In: Porwal, U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545561. Springer International Publishing, Cham (2022)" }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 139.37, "t": 612.16, "r": 480.59, "b": 631.19, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 620.23, "r_x1": 146.44, "r_y1": 620.23, "r_x2": 146.44, "r_y2": 612.16, "r_x3": 139.37, "r_y3": 612.16, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.98, "r_y0": 620.23, "r_x1": 480.59, "r_y1": 620.23, "r_x2": 480.59, "r_y2": 612.16, "r_x3": 150.98, "r_y3": 612.16, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 631.19, "r_x1": 400.23, "r_y1": 631.19, "r_x2": 400.23, "r_y2": 623.12, "r_x3": 151.52, "r_y3": 623.12, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table structure recognition. arXiv preprint arXiv:1908.04729 (2019)" }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 139.37, "t": 634.88, "r": 480.59, "b": 664.87, "coord_origin": "TOPLEFT" }, "confidence": 0.975, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 642.95, "r_x1": 146.52, "r_y1": 642.95, "r_x2": 146.52, "r_y2": 634.88, "r_x3": 139.37, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.12, "r_y0": 642.95, "r_x1": 480.59, "r_y1": 642.95, "r_x2": 480.59, "r_y2": 634.88, "r_x3": 151.12, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 653.91, "r_x1": 480.59, "r_y1": 653.91, "r_x2": 480.59, "r_y2": 645.84, "r_x3": 151.52, "r_y3": 645.84, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 664.87, "r_x1": 350.11, "r_y1": 664.87, "r_x2": 350.11, "r_y2": 656.8, "r_x3": 151.52, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific table recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 894-901. IEEE (2019)" } ], "body": [ { "label": "section_header", "id": 8, "page_no": 11, "cluster": { "id": 8, "label": "section_header", "bbox": { "l": 134.76, "t": 117.55, "r": 219.25, "b": 128.12, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 128.12, "r_x1": 141.49, "r_y1": 128.12, "r_x2": 141.49, "r_y2": 117.55, "r_x3": 134.76, "r_y3": 117.55, "coord_origin": "TOPLEFT" }, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 154.94, "r_y0": 128.12, "r_x1": 219.25, "r_y1": 128.12, "r_x2": 219.25, "r_y2": 117.55, "r_x3": 154.94, "r_y3": 117.55, "coord_origin": "TOPLEFT" }, "text": "Conclusion", "orig": "Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6 Conclusion" }, { "label": "text", "id": 2, "page_no": 11, "cluster": { "id": 2, "label": "text", "bbox": { "l": 134.76, "t": 146.86, "r": 480.6, "b": 203.48, "coord_origin": "TOPLEFT" }, "confidence": 0.981, "cells": [ { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 155.66, "r_x1": 480.59, "r_y1": 155.66, "r_x2": 480.59, "r_y2": 146.86, "r_x3": 134.76, "r_y3": 146.86, "coord_origin": "TOPLEFT" }, "text": "We demonstrated that representing tables in HTML for the task of table struc-", "orig": "We demonstrated that representing tables in HTML for the task of table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 167.62, "r_x1": 480.59, "r_y1": 167.62, "r_x2": 480.59, "r_y2": 158.82, "r_x3": 134.76, "r_y3": 158.82, "coord_origin": "TOPLEFT" }, "text": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "orig": "ture recognition with Im2Seq models is ill-suited and has serious limitations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 179.57, "r_x1": 480.59, "r_y1": 179.57, "r_x2": 480.59, "r_y2": 170.77, "r_x3": 134.76, "r_y3": 170.77, "coord_origin": "TOPLEFT" }, "text": "Furthermore, we presented in this paper an Optimized Table Structure Language", "orig": "Furthermore, we presented in this paper an Optimized Table Structure Language", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 191.53, "r_x1": 480.6, "r_y1": 191.53, "r_x2": 480.6, "r_y2": 182.73, "r_x3": 134.76, "r_y3": 182.73, "coord_origin": "TOPLEFT" }, "text": "(OTSL) which, when compared to commonly used general purpose languages,", "orig": "(OTSL) which, when compared to commonly used general purpose languages,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 203.48, "r_x1": 239.54, "r_y1": 203.48, "r_x2": 239.54, "r_y2": 194.68, "r_x3": 134.76, "r_y3": 194.68, "coord_origin": "TOPLEFT" }, "text": "has several key benefits.", "orig": "has several key benefits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "We demonstrated that representing tables in HTML for the task of table structure recognition with Im2Seq models is ill-suited and has serious limitations. Furthermore, we presented in this paper an Optimized Table Structure Language (OTSL) which, when compared to commonly used general purpose languages, has several key benefits." }, { "label": "text", "id": 0, "page_no": 11, "cluster": { "id": 0, "label": "text", "bbox": { "l": 134.76, "t": 207.44, "r": 480.59, "b": 323.84, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 216.24, "r_x1": 480.59, "r_y1": 216.24, "r_x2": 480.59, "r_y2": 207.44, "r_x3": 149.71, "r_y3": 207.44, "coord_origin": "TOPLEFT" }, "text": "First and foremost, given the same network configuration, inference time for", "orig": "First and foremost, given the same network configuration, inference time for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 228.2, "r_x1": 480.59, "r_y1": 228.2, "r_x2": 480.59, "r_y2": 219.4, "r_x3": 134.76, "r_y3": 219.4, "coord_origin": "TOPLEFT" }, "text": "a table-structure prediction is about 2 times faster compared to the conventional", "orig": "a table-structure prediction is about 2 times faster compared to the conventional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 240.15, "r_x1": 480.59, "r_y1": 240.15, "r_x2": 480.59, "r_y2": 231.35, "r_x3": 134.76, "r_y3": 231.35, "coord_origin": "TOPLEFT" }, "text": "HTML approach. This is primarily owed to the shorter sequence length of the", "orig": "HTML approach. This is primarily owed to the shorter sequence length of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 252.11, "r_x1": 480.59, "r_y1": 252.11, "r_x2": 480.59, "r_y2": 243.31, "r_x3": 134.76, "r_y3": 243.31, "coord_origin": "TOPLEFT" }, "text": "OTSL representation. Additional performance benefits can be obtained with", "orig": "OTSL representation. Additional performance benefits can be obtained with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 264.06, "r_x1": 480.59, "r_y1": 264.06, "r_x2": 480.59, "r_y2": 255.26, "r_x3": 134.76, "r_y3": 255.26, "coord_origin": "TOPLEFT" }, "text": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "orig": "HPO (hyper parameter optimization). As we demonstrate in our experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 276.02, "r_x1": 480.59, "r_y1": 276.02, "r_x2": 480.59, "r_y2": 267.22, "r_x3": 134.76, "r_y3": 267.22, "coord_origin": "TOPLEFT" }, "text": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "orig": "models trained on OTSL can be significantly smaller, e.g. by reducing the number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 287.97, "r_x1": 480.59, "r_y1": 287.97, "r_x2": 480.59, "r_y2": 279.17, "r_x3": 134.76, "r_y3": 279.17, "coord_origin": "TOPLEFT" }, "text": "of encoder and decoder layers, while preserving comparatively good prediction", "orig": "of encoder and decoder layers, while preserving comparatively good prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 299.93, "r_x1": 480.59, "r_y1": 299.93, "r_x2": 480.59, "r_y2": 291.13, "r_x3": 134.76, "r_y3": 291.13, "coord_origin": "TOPLEFT" }, "text": "quality. This can further improve inference performance, yielding 5-6 times faster", "orig": "quality. This can further improve inference performance, yielding 5-6 times faster", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 311.88, "r_x1": 480.59, "r_y1": 311.88, "r_x2": 480.59, "r_y2": 303.08, "r_x3": 134.76, "r_y3": 303.08, "coord_origin": "TOPLEFT" }, "text": "inference speed in OTSL with prediction quality comparable to models trained", "orig": "inference speed in OTSL with prediction quality comparable to models trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 323.84, "r_x1": 240.92, "r_y1": 323.84, "r_x2": 240.92, "r_y2": 315.04, "r_x3": 134.76, "r_y3": 315.04, "coord_origin": "TOPLEFT" }, "text": "on HTML (see Table 1).", "orig": "on HTML (see Table 1).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "First and foremost, given the same network configuration, inference time for a table-structure prediction is about 2 times faster compared to the conventional HTML approach. This is primarily owed to the shorter sequence length of the OTSL representation. Additional performance benefits can be obtained with HPO (hyper parameter optimization). As we demonstrate in our experiments, models trained on OTSL can be significantly smaller, e.g. by reducing the number of encoder and decoder layers, while preserving comparatively good prediction quality. This can further improve inference performance, yielding 5-6 times faster inference speed in OTSL with prediction quality comparable to models trained on HTML (see Table 1)." }, { "label": "text", "id": 1, "page_no": 11, "cluster": { "id": 1, "label": "text", "bbox": { "l": 134.76, "t": 327.8, "r": 480.59, "b": 468.1, "coord_origin": "TOPLEFT" }, "confidence": 0.987, "cells": [ { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.71, "r_y0": 336.6, "r_x1": 480.59, "r_y1": 336.6, "r_x2": 480.59, "r_y2": 327.8, "r_x3": 149.71, "r_y3": 327.8, "coord_origin": "TOPLEFT" }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "orig": "Secondly, OTSL has more inherent structure and a significantly restricted vo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 348.55, "r_x1": 480.59, "r_y1": 348.55, "r_x2": 480.59, "r_y2": 339.75, "r_x3": 134.76, "r_y3": 339.75, "coord_origin": "TOPLEFT" }, "text": "cabulary size. This allows autoregressive models to perform better in the TED", "orig": "cabulary size. This allows autoregressive models to perform better in the TED", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 360.51, "r_x1": 480.59, "r_y1": 360.51, "r_x2": 480.59, "r_y2": 351.71, "r_x3": 134.76, "r_y3": 351.71, "coord_origin": "TOPLEFT" }, "text": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "orig": "metric, but especially with regards to prediction accuracy of the table-cell bound-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 372.46, "r_x1": 480.59, "r_y1": 372.46, "r_x2": 480.59, "r_y2": 363.66, "r_x3": 134.76, "r_y3": 363.66, "coord_origin": "TOPLEFT" }, "text": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "orig": "ing boxes (see Table 2). As shown in Figure 5, we observe that the OTSL dras-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 384.42, "r_x1": 480.59, "r_y1": 384.42, "r_x2": 480.59, "r_y2": 375.62, "r_x3": 134.76, "r_y3": 375.62, "coord_origin": "TOPLEFT" }, "text": "tically reduces the drift for table cell bounding boxes at high row count and in", "orig": "tically reduces the drift for table cell bounding boxes at high row count and in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 396.37, "r_x1": 480.59, "r_y1": 396.37, "r_x2": 480.59, "r_y2": 387.57, "r_x3": 134.76, "r_y3": 387.57, "coord_origin": "TOPLEFT" }, "text": "sparse tables. This leads to more accurate predictions and a significant reduction", "orig": "sparse tables. This leads to more accurate predictions and a significant reduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 408.33, "r_x1": 480.59, "r_y1": 408.33, "r_x2": 480.59, "r_y2": 399.53, "r_x3": 134.76, "r_y3": 399.53, "coord_origin": "TOPLEFT" }, "text": "in post-processing complexity, which is an undesired necessity in HTML-based", "orig": "in post-processing complexity, which is an undesired necessity in HTML-based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 420.28, "r_x1": 480.59, "r_y1": 420.28, "r_x2": 480.59, "r_y2": 411.49, "r_x3": 134.76, "r_y3": 411.49, "coord_origin": "TOPLEFT" }, "text": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "orig": "Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 432.24, "r_x1": 480.59, "r_y1": 432.24, "r_x2": 480.59, "r_y2": 423.44, "r_x3": 134.76, "r_y3": 423.44, "coord_origin": "TOPLEFT" }, "text": "simple and always backwards looking. Each new token can be validated only by", "orig": "simple and always backwards looking. Each new token can be validated only by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 444.19, "r_x1": 480.59, "r_y1": 444.19, "r_x2": 480.59, "r_y2": 435.4, "r_x3": 134.76, "r_y3": 435.4, "coord_origin": "TOPLEFT" }, "text": "analyzing the sequence of previous tokens, without requiring the entire sequence", "orig": "analyzing the sequence of previous tokens, without requiring the entire sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 456.15, "r_x1": 480.59, "r_y1": 456.15, "r_x2": 480.59, "r_y2": 447.35, "r_x3": 134.76, "r_y3": 447.35, "coord_origin": "TOPLEFT" }, "text": "to detect mistakes. This in return allows to perform structural error detection", "orig": "to detect mistakes. This in return allows to perform structural error detection", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 468.1, "r_x1": 366.78, "r_y1": 468.1, "r_x2": 366.78, "r_y2": 459.31, "r_x3": 134.76, "r_y3": 459.31, "coord_origin": "TOPLEFT" }, "text": "and correction on-the-fly during sequence generation.", "orig": "and correction on-the-fly during sequence generation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Secondly, OTSL has more inherent structure and a significantly restricted vocabulary size. This allows autoregressive models to perform better in the TED metric, but especially with regards to prediction accuracy of the table-cell bounding boxes (see Table 2). As shown in Figure 5, we observe that the OTSL drastically reduces the drift for table cell bounding boxes at high row count and in sparse tables. This leads to more accurate predictions and a significant reduction in post-processing complexity, which is an undesired necessity in HTML-based Im2Seq models. Significant novelty lies in OTSL syntactical rules, which are few, simple and always backwards looking. Each new token can be validated only by analyzing the sequence of previous tokens, without requiring the entire sequence to detect mistakes. This in return allows to perform structural error detection and correction on-the-fly during sequence generation." }, { "label": "section_header", "id": 7, "page_no": 11, "cluster": { "id": 7, "label": "section_header", "bbox": { "l": 134.76, "t": 493.82, "r": 197.69, "b": 504.39, "coord_origin": "TOPLEFT" }, "confidence": 0.94, "cells": [ { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 504.39, "r_x1": 197.69, "r_y1": 504.39, "r_x2": 197.69, "r_y2": 493.82, "r_x3": 134.76, "r_y3": 493.82, "coord_origin": "TOPLEFT" }, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "References" }, { "label": "list_item", "id": 5, "page_no": 11, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.37, "t": 522.88, "r": 480.59, "b": 563.87, "coord_origin": "TOPLEFT" }, "confidence": 0.97, "cells": [ { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 530.95, "r_x1": 146.46, "r_y1": 530.95, "r_x2": 146.46, "r_y2": 522.88, "r_x3": 139.37, "r_y3": 522.88, "coord_origin": "TOPLEFT" }, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.02, "r_y0": 530.95, "r_x1": 480.59, "r_y1": 530.95, "r_x2": 480.59, "r_y2": 522.88, "r_x3": 151.02, "r_y3": 522.88, "coord_origin": "TOPLEFT" }, "text": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "orig": "Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 541.91, "r_x1": 480.59, "r_y1": 541.91, "r_x2": 480.59, "r_y2": 533.84, "r_x3": 151.52, "r_y3": 533.84, "coord_origin": "TOPLEFT" }, "text": "ument conversion as a cloud service with high throughput and responsiveness.", "orig": "ument conversion as a cloud service with high throughput and responsiveness.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 552.87, "r_x1": 176.34, "r_y1": 552.87, "r_x2": 176.34, "r_y2": 544.8, "r_x3": 151.52, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "CoRR", "orig": "CoRR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 179.46, "r_y0": 552.66, "r_x1": 250.68, "r_y1": 552.66, "r_x2": 250.68, "r_y2": 544.74, "r_x3": 179.46, "r_y3": 544.74, "coord_origin": "TOPLEFT" }, "text": "abs/2206.00785", "orig": "abs/2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.8, "r_y0": 552.87, "r_x1": 281.96, "r_y1": 552.87, "r_x2": 281.96, "r_y2": 544.8, "r_x3": 253.8, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": "(2022).", "orig": "(2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.08, "r_y0": 552.91, "r_x1": 478.03, "r_y1": 552.91, "r_x2": 478.03, "r_y2": 545.44, "r_x3": 285.08, "r_y3": 545.44, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.03, "r_y0": 552.87, "r_x1": 480.59, "r_y1": 552.87, "r_x2": 480.59, "r_y2": 544.8, "r_x3": 478.03, "r_y3": 544.8, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 563.87, "r_x1": 344.47, "r_y1": 563.87, "r_x2": 344.47, "r_y2": 556.4, "r_x3": 151.52, "r_y3": 556.4, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/arXiv.2206.00785", "orig": "https://doi.org/10.48550/arXiv.2206.00785", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "1. Auer, C., Dolfi, M., Carvalho, A., Ramis, C.B., Staar, P.W.J.: Delivering document conversion as a cloud service with high throughput and responsiveness. CoRR abs/2206.00785 (2022). https://doi.org/10.48550/arXiv.2206.00785 , https://doi.org/10.48550/arXiv.2206.00785" }, { "label": "list_item", "id": 4, "page_no": 11, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.37, "t": 567.52, "r": 480.59, "b": 608.47, "coord_origin": "TOPLEFT" }, "confidence": 0.973, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 575.59, "r_x1": 145.94, "r_y1": 575.59, "r_x2": 145.94, "r_y2": 567.52, "r_x3": 139.37, "r_y3": 567.52, "coord_origin": "TOPLEFT" }, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.17, "r_y0": 575.59, "r_x1": 480.59, "r_y1": 575.59, "r_x2": 480.59, "r_y2": 567.52, "r_x3": 150.17, "r_y3": 567.52, "coord_origin": "TOPLEFT" }, "text": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "orig": "Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 586.55, "r_x1": 480.59, "r_y1": 586.55, "r_x2": 480.59, "r_y2": 578.48, "r_x3": 151.52, "r_y3": 578.48, "coord_origin": "TOPLEFT" }, "text": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "orig": "in the wild using transformer and identity matrix-based augmentation. In: Porwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 597.51, "r_x1": 480.59, "r_y1": 597.51, "r_x2": 480.59, "r_y2": 589.44, "r_x3": 151.52, "r_y3": 589.44, "coord_origin": "TOPLEFT" }, "text": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "orig": "U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 608.47, "r_x1": 364.18, "r_y1": 608.47, "r_x2": 364.18, "r_y2": 600.4, "r_x3": 151.52, "r_y3": 600.4, "coord_origin": "TOPLEFT" }, "text": "561. Springer International Publishing, Cham (2022)", "orig": "561. Springer International Publishing, Cham (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "2. Chen, B., Peng, D., Zhang, J., Ren, Y., Jin, L.: Complex table structure recognition in the wild using transformer and identity matrix-based augmentation. In: Porwal, U., Forn\u00e9s, A., Shafait, F. (eds.) Frontiers in Handwriting Recognition. pp. 545561. Springer International Publishing, Cham (2022)" }, { "label": "list_item", "id": 6, "page_no": 11, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 139.37, "t": 612.16, "r": 480.59, "b": 631.19, "coord_origin": "TOPLEFT" }, "confidence": 0.962, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 620.23, "r_x1": 146.44, "r_y1": 620.23, "r_x2": 146.44, "r_y2": 612.16, "r_x3": 139.37, "r_y3": 612.16, "coord_origin": "TOPLEFT" }, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.98, "r_y0": 620.23, "r_x1": 480.59, "r_y1": 620.23, "r_x2": 480.59, "r_y2": 612.16, "r_x3": 150.98, "r_y3": 612.16, "coord_origin": "TOPLEFT" }, "text": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "orig": "Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 631.19, "r_x1": 400.23, "r_y1": 631.19, "r_x2": 400.23, "r_y2": 623.12, "r_x3": 151.52, "r_y3": 623.12, "coord_origin": "TOPLEFT" }, "text": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "orig": "structure recognition. arXiv preprint arXiv:1908.04729 (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "3. Chi, Z., Huang, H., Xu, H.D., Yu, H., Yin, W., Mao, X.L.: Complicated table structure recognition. arXiv preprint arXiv:1908.04729 (2019)" }, { "label": "list_item", "id": 3, "page_no": 11, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 139.37, "t": 634.88, "r": 480.59, "b": 664.87, "coord_origin": "TOPLEFT" }, "confidence": 0.975, "cells": [ { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 642.95, "r_x1": 146.52, "r_y1": 642.95, "r_x2": 146.52, "r_y2": 634.88, "r_x3": 139.37, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.12, "r_y0": 642.95, "r_x1": 480.59, "r_y1": 642.95, "r_x2": 480.59, "r_y2": 634.88, "r_x3": 151.12, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "orig": "Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 653.91, "r_x1": 480.59, "r_y1": 653.91, "r_x2": 480.59, "r_y2": 645.84, "r_x3": 151.52, "r_y3": 645.84, "coord_origin": "TOPLEFT" }, "text": "table recognition. In: 2019 International Conference on Document Analysis and", "orig": "table recognition. In: 2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 664.87, "r_x1": 350.11, "r_y1": 664.87, "r_x2": 350.11, "r_y2": 656.8, "r_x3": 151.52, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "orig": "Recognition (ICDAR). pp. 894-901. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "4. Deng, Y., Rosenberg, D., Mann, G.: Challenges in end-to-end neural scientific table recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 894-901. IEEE (2019)" } ], "headers": [ { "label": "page_header", "id": 10, "page_no": 11, "cluster": { "id": 10, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 143.98, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.861, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12" }, { "label": "page_header", "id": 9, "page_no": 11, "cluster": { "id": 9, "label": "page_header", "bbox": { "l": 167.82, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.893, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } }, { "page_no": 12, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.38, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 471.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 127.74, "r_x1": 146.05, "r_y1": 127.74, "r_x2": 146.05, "r_y2": 119.67, "r_x3": 139.37, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.34, "r_y0": 127.74, "r_x1": 480.59, "r_y1": 127.74, "r_x2": 480.59, "r_y2": 119.67, "r_x3": 150.34, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 138.7, "r_x1": 480.59, "r_y1": 138.7, "r_x2": 480.59, "r_y2": 130.63, "r_x3": 151.52, "r_y3": 130.63, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 149.66, "r_x1": 304.04, "r_y1": 149.66, "r_x2": 304.04, "r_y2": 141.59, "r_x3": 151.52, "r_y3": 141.59, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 160.63, "r_x1": 145.94, "r_y1": 160.63, "r_x2": 145.94, "r_y2": 152.56, "r_x3": 139.37, "r_y3": 152.56, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16, "r_y0": 160.63, "r_x1": 480.59, "r_y1": 160.63, "r_x2": 480.59, "r_y2": 152.56, "r_x3": 150.16, "r_y3": 152.56, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 171.59, "r_x1": 480.59, "r_y1": 171.59, "r_x2": 480.59, "r_y2": 163.52, "r_x3": 151.52, "r_y3": 163.52, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 182.55, "r_x1": 480.59, "r_y1": 182.55, "r_x2": 480.59, "r_y2": 174.48, "r_x3": 151.52, "r_y3": 174.48, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 193.51, "r_x1": 226.37, "r_y1": 193.51, "r_x2": 226.37, "r_y2": 185.44, "r_x3": 151.52, "r_y3": 185.44, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 204.48, "r_x1": 146.31, "r_y1": 204.48, "r_x2": 146.31, "r_y2": 196.41, "r_x3": 139.37, "r_y3": 196.41, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.78, "r_y0": 204.48, "r_x1": 480.59, "r_y1": 204.48, "r_x2": 480.59, "r_y2": 196.41, "r_x3": 150.78, "r_y3": 196.41, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 215.44, "r_x1": 352.02, "r_y1": 215.44, "r_x2": 352.02, "r_y2": 207.37, "r_x3": 151.52, "r_y3": 207.37, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 226.41, "r_x1": 146.37, "r_y1": 226.41, "r_x2": 146.37, "r_y2": 218.34, "r_x3": 139.37, "r_y3": 218.34, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.87, "r_y0": 226.41, "r_x1": 480.59, "r_y1": 226.41, "r_x2": 480.59, "r_y2": 218.34, "r_x3": 150.87, "r_y3": 218.34, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 237.37, "r_x1": 480.59, "r_y1": 237.37, "r_x2": 480.59, "r_y2": 229.3, "r_x3": 151.52, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 248.33, "r_x1": 480.59, "r_y1": 248.33, "r_x2": 480.59, "r_y2": 240.26, "r_x3": 151.52, "r_y3": 240.26, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 259.29, "r_x1": 197.09, "r_y1": 259.29, "r_x2": 197.09, "r_y2": 251.22, "r_x3": 151.52, "r_y3": 251.22, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.4, "r_y0": 259.08, "r_x1": 210.01, "r_y1": 259.08, "r_x2": 210.01, "r_y2": 251.15, "r_x3": 199.4, "r_y3": 251.15, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.01, "r_y0": 259.29, "r_x1": 332.38, "r_y1": 259.29, "r_x2": 332.38, "r_y2": 251.22, "r_x3": 210.01, "r_y3": 251.22, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.7, "r_y0": 259.33, "r_x1": 480.59, "r_y1": 259.33, "r_x2": 480.59, "r_y2": 251.86, "r_x3": 334.7, "r_y3": 251.86, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 270.29, "r_x1": 259.76, "r_y1": 270.29, "r_x2": 259.76, "r_y2": 262.82, "r_x3": 151.52, "r_y3": 262.82, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 281.21, "r_x1": 146.14, "r_y1": 281.21, "r_x2": 146.14, "r_y2": 273.14, "r_x3": 139.37, "r_y3": 273.14, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 281.21, "r_x1": 480.59, "r_y1": 281.21, "r_x2": 480.59, "r_y2": 273.14, "r_x3": 150.5, "r_y3": 273.14, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 292.17, "r_x1": 480.59, "r_y1": 292.17, "r_x2": 480.59, "r_y2": 284.1, "r_x3": 151.52, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 303.13, "r_x1": 473.44, "r_y1": 303.13, "r_x2": 473.44, "r_y2": 295.06, "r_x3": 151.52, "r_y3": 295.06, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 314.1, "r_x1": 146.5, "r_y1": 314.1, "r_x2": 146.5, "r_y2": 306.03, "r_x3": 134.76, "r_y3": 306.03, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.09, "r_y0": 314.1, "r_x1": 480.59, "r_y1": 314.1, "r_x2": 480.59, "r_y2": 306.03, "r_x3": 151.09, "r_y3": 306.03, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 325.06, "r_x1": 480.59, "r_y1": 325.06, "r_x2": 480.59, "r_y2": 316.99, "r_x3": 151.52, "r_y3": 316.99, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 336.02, "r_x1": 480.59, "r_y1": 336.02, "r_x2": 480.59, "r_y2": 327.95, "r_x3": 151.52, "r_y3": 327.95, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 346.98, "r_x1": 480.59, "r_y1": 346.98, "r_x2": 480.59, "r_y2": 338.91, "r_x3": 151.52, "r_y3": 338.91, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 357.94, "r_x1": 251.14, "r_y1": 357.94, "r_x2": 251.14, "r_y2": 349.87, "r_x3": 151.52, "r_y3": 349.87, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.99, "r_y0": 357.98, "r_x1": 437.53, "r_y1": 357.98, "r_x2": 437.53, "r_y2": 350.51, "r_x3": 253.99, "r_y3": 350.51, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.53, "r_y0": 357.94, "r_x1": 440.09, "r_y1": 357.94, "r_x2": 440.09, "r_y2": 349.87, "r_x3": 437.53, "r_y3": 349.87, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94, "r_y0": 357.98, "r_x1": 480.59, "r_y1": 357.98, "r_x2": 480.59, "r_y2": 350.51, "r_x3": 442.94, "r_y3": 350.51, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 368.94, "r_x1": 297.41, "r_y1": 368.94, "r_x2": 297.41, "r_y2": 361.47, "r_x3": 151.52, "r_y3": 361.47, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.87, "r_x1": 146.04, "r_y1": 379.87, "r_x2": 146.04, "r_y2": 371.8, "r_x3": 134.76, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.45, "r_y0": 379.87, "r_x1": 480.59, "r_y1": 379.87, "r_x2": 480.59, "r_y2": 371.8, "r_x3": 150.45, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 390.83, "r_x1": 480.59, "r_y1": 390.83, "r_x2": 480.59, "r_y2": 382.76, "r_x3": 151.52, "r_y3": 382.76, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 401.79, "r_x1": 480.59, "r_y1": 401.79, "r_x2": 480.59, "r_y2": 393.72, "r_x3": 151.52, "r_y3": 393.72, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 412.74, "r_x1": 373.83, "r_y1": 412.74, "r_x2": 373.83, "r_y2": 404.67, "r_x3": 151.52, "r_y3": 404.67, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 423.71, "r_x1": 145.91, "r_y1": 423.71, "r_x2": 145.91, "r_y2": 415.64, "r_x3": 134.76, "r_y3": 415.64, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.27, "r_y0": 423.71, "r_x1": 480.59, "r_y1": 423.71, "r_x2": 480.59, "r_y2": 415.64, "r_x3": 150.27, "r_y3": 415.64, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 434.67, "r_x1": 480.59, "r_y1": 434.67, "r_x2": 480.59, "r_y2": 426.6, "r_x3": 151.52, "r_y3": 426.6, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 445.63, "r_x1": 480.59, "r_y1": 445.63, "r_x2": 480.59, "r_y2": 437.56, "r_x3": 151.52, "r_y3": 437.56, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 456.59, "r_x1": 292.91, "r_y1": 456.59, "r_x2": 292.91, "r_y2": 448.52, "r_x3": 151.52, "r_y3": 448.52, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 467.56, "r_x1": 145.78, "r_y1": 467.56, "r_x2": 145.78, "r_y2": 459.49, "r_x3": 134.76, "r_y3": 459.49, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.09, "r_y0": 467.56, "r_x1": 480.59, "r_y1": 467.56, "r_x2": 480.59, "r_y2": 459.49, "r_x3": 150.09, "r_y3": 459.49, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 478.52, "r_x1": 480.59, "r_y1": 478.52, "r_x2": 480.59, "r_y2": 470.45, "r_x3": 151.52, "r_y3": 470.45, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 489.48, "r_x1": 439.06, "r_y1": 489.48, "r_x2": 439.06, "r_y2": 481.41, "r_x3": 151.52, "r_y3": 481.41, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94, "r_y0": 489.52, "r_x1": 480.59, "r_y1": 489.52, "r_x2": 480.59, "r_y2": 482.06, "r_x3": 442.94, "r_y3": 482.06, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 500.48, "r_x1": 302.12, "r_y1": 500.48, "r_x2": 302.12, "r_y2": 493.01, "r_x3": 151.52, "r_y3": 493.01, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 511.41, "r_x1": 146.16, "r_y1": 511.41, "r_x2": 146.16, "r_y2": 503.34, "r_x3": 134.76, "r_y3": 503.34, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.61, "r_y0": 511.41, "r_x1": 480.59, "r_y1": 511.41, "r_x2": 480.59, "r_y2": 503.34, "r_x3": 150.61, "r_y3": 503.34, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 522.37, "r_x1": 480.59, "r_y1": 522.37, "r_x2": 480.59, "r_y2": 514.3, "r_x3": 151.52, "r_y3": 514.3, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 533.33, "r_x1": 480.59, "r_y1": 533.33, "r_x2": 480.59, "r_y2": 525.26, "r_x3": 151.52, "r_y3": 525.26, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 544.29, "r_x1": 199.25, "r_y1": 544.29, "r_x2": 199.25, "r_y2": 536.22, "r_x3": 151.52, "r_y3": 536.22, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 555.26, "r_x1": 146.17, "r_y1": 555.26, "r_x2": 146.17, "r_y2": 547.19, "r_x3": 134.76, "r_y3": 547.19, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.63, "r_y0": 555.26, "r_x1": 480.59, "r_y1": 555.26, "r_x2": 480.59, "r_y2": 547.19, "r_x3": 150.63, "r_y3": 547.19, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 566.21, "r_x1": 480.59, "r_y1": 566.21, "r_x2": 480.59, "r_y2": 558.14, "r_x3": 151.52, "r_y3": 558.14, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 577.17, "r_x1": 480.59, "r_y1": 577.17, "r_x2": 480.59, "r_y2": 569.1, "r_x3": 151.52, "r_y3": 569.1, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 588.13, "r_x1": 480.59, "r_y1": 588.13, "r_x2": 480.59, "r_y2": 580.06, "r_x3": 151.52, "r_y3": 580.06, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 599.09, "r_x1": 200.76, "r_y1": 599.09, "r_x2": 200.76, "r_y2": 591.02, "r_x3": 151.52, "r_y3": 591.02, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.92, "r_y0": 599.14, "r_x1": 386.46, "r_y1": 599.14, "r_x2": 386.46, "r_y2": 591.67, "r_x3": 202.92, "r_y3": 591.67, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.46, "r_y0": 599.09, "r_x1": 389.02, "r_y1": 599.09, "r_x2": 389.02, "r_y2": 591.02, "r_x3": 386.46, "r_y3": 591.02, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.17, "r_y0": 599.14, "r_x1": 480.6, "r_y1": 599.14, "r_x2": 480.6, "r_y2": 591.67, "r_x3": 391.17, "r_y3": 591.67, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 610.1, "r_x1": 245.64, "r_y1": 610.1, "r_x2": 245.64, "r_y2": 602.63, "r_x3": 151.52, "r_y3": 602.63, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 621.02, "r_x1": 146.62, "r_y1": 621.02, "r_x2": 146.62, "r_y2": 612.95, "r_x3": 134.76, "r_y3": 612.95, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.26, "r_y0": 621.02, "r_x1": 480.6, "r_y1": 621.02, "r_x2": 480.6, "r_y2": 612.95, "r_x3": 151.26, "r_y3": 612.95, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 631.98, "r_x1": 234.43, "r_y1": 631.98, "r_x2": 234.43, "r_y2": 623.91, "r_x3": 151.52, "r_y3": 623.91, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 642.95, "r_x1": 146.31, "r_y1": 642.95, "r_x2": 146.31, "r_y2": 634.88, "r_x3": 134.76, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.82, "r_y0": 642.95, "r_x1": 480.59, "r_y1": 642.95, "r_x2": 480.59, "r_y2": 634.88, "r_x3": 150.82, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 653.91, "r_x1": 480.59, "r_y1": 653.91, "r_x2": 480.59, "r_y2": 645.84, "r_x3": 151.52, "r_y3": 645.84, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 664.87, "r_x1": 299.3, "r_y1": 664.87, "r_x2": 299.3, "r_y2": 656.8, "r_x3": 151.52, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 13, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 14, "label": "page_header", "bbox": { "l": 471.38, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.906, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.38, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 471.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 139.37, "t": 119.67, "r": 480.59, "b": 149.66, "coord_origin": "TOPLEFT" }, "confidence": 0.968, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 127.74, "r_x1": 146.05, "r_y1": 127.74, "r_x2": 146.05, "r_y2": 119.67, "r_x3": 139.37, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.34, "r_y0": 127.74, "r_x1": 480.59, "r_y1": 127.74, "r_x2": 480.59, "r_y2": 119.67, "r_x3": 150.34, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 138.7, "r_x1": 480.59, "r_y1": 138.7, "r_x2": 480.59, "r_y2": 130.63, "r_x3": 151.52, "r_y3": 130.63, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 149.66, "r_x1": 304.04, "r_y1": 149.66, "r_x2": 304.04, "r_y2": 141.59, "r_x3": 151.52, "r_y3": 141.59, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 139.37, "t": 152.56, "r": 480.59, "b": 193.51, "coord_origin": "TOPLEFT" }, "confidence": 0.973, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 160.63, "r_x1": 145.94, "r_y1": 160.63, "r_x2": 145.94, "r_y2": 152.56, "r_x3": 139.37, "r_y3": 152.56, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16, "r_y0": 160.63, "r_x1": 480.59, "r_y1": 160.63, "r_x2": 480.59, "r_y2": 152.56, "r_x3": 150.16, "r_y3": 152.56, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 171.59, "r_x1": 480.59, "r_y1": 171.59, "r_x2": 480.59, "r_y2": 163.52, "r_x3": 151.52, "r_y3": 163.52, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 182.55, "r_x1": 480.59, "r_y1": 182.55, "r_x2": 480.59, "r_y2": 174.48, "r_x3": 151.52, "r_y3": 174.48, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 193.51, "r_x1": 226.37, "r_y1": 193.51, "r_x2": 226.37, "r_y2": 185.44, "r_x3": 151.52, "r_y3": 185.44, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 10, "label": "list_item", "bbox": { "l": 139.37, "t": 196.41, "r": 480.59, "b": 215.44, "coord_origin": "TOPLEFT" }, "confidence": 0.958, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 204.48, "r_x1": 146.31, "r_y1": 204.48, "r_x2": 146.31, "r_y2": 196.41, "r_x3": 139.37, "r_y3": 196.41, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.78, "r_y0": 204.48, "r_x1": 480.59, "r_y1": 204.48, "r_x2": 480.59, "r_y2": 196.41, "r_x3": 150.78, "r_y3": 196.41, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 215.44, "r_x1": 352.02, "r_y1": 215.44, "r_x2": 352.02, "r_y2": 207.37, "r_x3": 151.52, "r_y3": 207.37, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 139.37, "t": 218.34, "r": 480.59, "b": 270.29, "coord_origin": "TOPLEFT" }, "confidence": 0.968, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 226.41, "r_x1": 146.37, "r_y1": 226.41, "r_x2": 146.37, "r_y2": 218.34, "r_x3": 139.37, "r_y3": 218.34, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.87, "r_y0": 226.41, "r_x1": 480.59, "r_y1": 226.41, "r_x2": 480.59, "r_y2": 218.34, "r_x3": 150.87, "r_y3": 218.34, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 237.37, "r_x1": 480.59, "r_y1": 237.37, "r_x2": 480.59, "r_y2": 229.3, "r_x3": 151.52, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 248.33, "r_x1": 480.59, "r_y1": 248.33, "r_x2": 480.59, "r_y2": 240.26, "r_x3": 151.52, "r_y3": 240.26, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 259.29, "r_x1": 197.09, "r_y1": 259.29, "r_x2": 197.09, "r_y2": 251.22, "r_x3": 151.52, "r_y3": 251.22, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.4, "r_y0": 259.08, "r_x1": 210.01, "r_y1": 259.08, "r_x2": 210.01, "r_y2": 251.15, "r_x3": 199.4, "r_y3": 251.15, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.01, "r_y0": 259.29, "r_x1": 332.38, "r_y1": 259.29, "r_x2": 332.38, "r_y2": 251.22, "r_x3": 210.01, "r_y3": 251.22, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.7, "r_y0": 259.33, "r_x1": 480.59, "r_y1": 259.33, "r_x2": 480.59, "r_y2": 251.86, "r_x3": 334.7, "r_y3": 251.86, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 270.29, "r_x1": 259.76, "r_y1": 270.29, "r_x2": 259.76, "r_y2": 262.82, "r_x3": 151.52, "r_y3": 262.82, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 11, "label": "list_item", "bbox": { "l": 139.37, "t": 273.14, "r": 480.59, "b": 303.13, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 281.21, "r_x1": 146.14, "r_y1": 281.21, "r_x2": 146.14, "r_y2": 273.14, "r_x3": 139.37, "r_y3": 273.14, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 281.21, "r_x1": 480.59, "r_y1": 281.21, "r_x2": 480.59, "r_y2": 273.14, "r_x3": 150.5, "r_y3": 273.14, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 292.17, "r_x1": 480.59, "r_y1": 292.17, "r_x2": 480.59, "r_y2": 284.1, "r_x3": 151.52, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 303.13, "r_x1": 473.44, "r_y1": 303.13, "r_x2": 473.44, "r_y2": 295.06, "r_x3": 151.52, "r_y3": 295.06, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 9, "label": "list_item", "bbox": { "l": 134.76, "t": 306.03, "r": 480.59, "b": 368.94, "coord_origin": "TOPLEFT" }, "confidence": 0.964, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 314.1, "r_x1": 146.5, "r_y1": 314.1, "r_x2": 146.5, "r_y2": 306.03, "r_x3": 134.76, "r_y3": 306.03, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.09, "r_y0": 314.1, "r_x1": 480.59, "r_y1": 314.1, "r_x2": 480.59, "r_y2": 306.03, "r_x3": 151.09, "r_y3": 306.03, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 325.06, "r_x1": 480.59, "r_y1": 325.06, "r_x2": 480.59, "r_y2": 316.99, "r_x3": 151.52, "r_y3": 316.99, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 336.02, "r_x1": 480.59, "r_y1": 336.02, "r_x2": 480.59, "r_y2": 327.95, "r_x3": 151.52, "r_y3": 327.95, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 346.98, "r_x1": 480.59, "r_y1": 346.98, "r_x2": 480.59, "r_y2": 338.91, "r_x3": 151.52, "r_y3": 338.91, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 357.94, "r_x1": 251.14, "r_y1": 357.94, "r_x2": 251.14, "r_y2": 349.87, "r_x3": 151.52, "r_y3": 349.87, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.99, "r_y0": 357.98, "r_x1": 437.53, "r_y1": 357.98, "r_x2": 437.53, "r_y2": 350.51, "r_x3": 253.99, "r_y3": 350.51, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.53, "r_y0": 357.94, "r_x1": 440.09, "r_y1": 357.94, "r_x2": 440.09, "r_y2": 349.87, "r_x3": 437.53, "r_y3": 349.87, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94, "r_y0": 357.98, "r_x1": 480.59, "r_y1": 357.98, "r_x2": 480.59, "r_y2": 350.51, "r_x3": 442.94, "r_y3": 350.51, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 368.94, "r_x1": 297.41, "r_y1": 368.94, "r_x2": 297.41, "r_y2": 361.47, "r_x3": 151.52, "r_y3": 361.47, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "list_item", "bbox": { "l": 134.76, "t": 371.8, "r": 480.59, "b": 412.74, "coord_origin": "TOPLEFT" }, "confidence": 0.975, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.87, "r_x1": 146.04, "r_y1": 379.87, "r_x2": 146.04, "r_y2": 371.8, "r_x3": 134.76, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.45, "r_y0": 379.87, "r_x1": 480.59, "r_y1": 379.87, "r_x2": 480.59, "r_y2": 371.8, "r_x3": 150.45, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 390.83, "r_x1": 480.59, "r_y1": 390.83, "r_x2": 480.59, "r_y2": 382.76, "r_x3": 151.52, "r_y3": 382.76, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 401.79, "r_x1": 480.59, "r_y1": 401.79, "r_x2": 480.59, "r_y2": 393.72, "r_x3": 151.52, "r_y3": 393.72, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 412.74, "r_x1": 373.83, "r_y1": 412.74, "r_x2": 373.83, "r_y2": 404.67, "r_x3": 151.52, "r_y3": 404.67, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 134.76, "t": 415.64, "r": 480.59, "b": 456.59, "coord_origin": "TOPLEFT" }, "confidence": 0.971, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 423.71, "r_x1": 145.91, "r_y1": 423.71, "r_x2": 145.91, "r_y2": 415.64, "r_x3": 134.76, "r_y3": 415.64, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.27, "r_y0": 423.71, "r_x1": 480.59, "r_y1": 423.71, "r_x2": 480.59, "r_y2": 415.64, "r_x3": 150.27, "r_y3": 415.64, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 434.67, "r_x1": 480.59, "r_y1": 434.67, "r_x2": 480.59, "r_y2": 426.6, "r_x3": 151.52, "r_y3": 426.6, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 445.63, "r_x1": 480.59, "r_y1": 445.63, "r_x2": 480.59, "r_y2": 437.56, "r_x3": 151.52, "r_y3": 437.56, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 456.59, "r_x1": 292.91, "r_y1": 456.59, "r_x2": 292.91, "r_y2": 448.52, "r_x3": 151.52, "r_y3": 448.52, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 7, "label": "list_item", "bbox": { "l": 134.76, "t": 459.49, "r": 480.59, "b": 500.48, "coord_origin": "TOPLEFT" }, "confidence": 0.966, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 467.56, "r_x1": 145.78, "r_y1": 467.56, "r_x2": 145.78, "r_y2": 459.49, "r_x3": 134.76, "r_y3": 459.49, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.09, "r_y0": 467.56, "r_x1": 480.59, "r_y1": 467.56, "r_x2": 480.59, "r_y2": 459.49, "r_x3": 150.09, "r_y3": 459.49, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 478.52, "r_x1": 480.59, "r_y1": 478.52, "r_x2": 480.59, "r_y2": 470.45, "r_x3": 151.52, "r_y3": 470.45, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 489.48, "r_x1": 439.06, "r_y1": 489.48, "r_x2": 439.06, "r_y2": 481.41, "r_x3": 151.52, "r_y3": 481.41, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94, "r_y0": 489.52, "r_x1": 480.59, "r_y1": 489.52, "r_x2": 480.59, "r_y2": 482.06, "r_x3": 442.94, "r_y3": 482.06, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 500.48, "r_x1": 302.12, "r_y1": 500.48, "r_x2": 302.12, "r_y2": 493.01, "r_x3": 151.52, "r_y3": 493.01, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 134.76, "t": 503.34, "r": 480.59, "b": 544.29, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 511.41, "r_x1": 146.16, "r_y1": 511.41, "r_x2": 146.16, "r_y2": 503.34, "r_x3": 134.76, "r_y3": 503.34, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.61, "r_y0": 511.41, "r_x1": 480.59, "r_y1": 511.41, "r_x2": 480.59, "r_y2": 503.34, "r_x3": 150.61, "r_y3": 503.34, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 522.37, "r_x1": 480.59, "r_y1": 522.37, "r_x2": 480.59, "r_y2": 514.3, "r_x3": 151.52, "r_y3": 514.3, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 533.33, "r_x1": 480.59, "r_y1": 533.33, "r_x2": 480.59, "r_y2": 525.26, "r_x3": 151.52, "r_y3": 525.26, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 544.29, "r_x1": 199.25, "r_y1": 544.29, "r_x2": 199.25, "r_y2": 536.22, "r_x3": 151.52, "r_y3": 536.22, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "list_item", "bbox": { "l": 134.76, "t": 547.19, "r": 480.6, "b": 610.1, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 555.26, "r_x1": 146.17, "r_y1": 555.26, "r_x2": 146.17, "r_y2": 547.19, "r_x3": 134.76, "r_y3": 547.19, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.63, "r_y0": 555.26, "r_x1": 480.59, "r_y1": 555.26, "r_x2": 480.59, "r_y2": 547.19, "r_x3": 150.63, "r_y3": 547.19, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 566.21, "r_x1": 480.59, "r_y1": 566.21, "r_x2": 480.59, "r_y2": 558.14, "r_x3": 151.52, "r_y3": 558.14, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 577.17, "r_x1": 480.59, "r_y1": 577.17, "r_x2": 480.59, "r_y2": 569.1, "r_x3": 151.52, "r_y3": 569.1, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 588.13, "r_x1": 480.59, "r_y1": 588.13, "r_x2": 480.59, "r_y2": 580.06, "r_x3": 151.52, "r_y3": 580.06, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 599.09, "r_x1": 200.76, "r_y1": 599.09, "r_x2": 200.76, "r_y2": 591.02, "r_x3": 151.52, "r_y3": 591.02, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.92, "r_y0": 599.14, "r_x1": 386.46, "r_y1": 599.14, "r_x2": 386.46, "r_y2": 591.67, "r_x3": 202.92, "r_y3": 591.67, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.46, "r_y0": 599.09, "r_x1": 389.02, "r_y1": 599.09, "r_x2": 389.02, "r_y2": 591.02, "r_x3": 386.46, "r_y3": 591.02, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.17, "r_y0": 599.14, "r_x1": 480.6, "r_y1": 599.14, "r_x2": 480.6, "r_y2": 591.67, "r_x3": 391.17, "r_y3": 591.67, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 610.1, "r_x1": 245.64, "r_y1": 610.1, "r_x2": 245.64, "r_y2": 602.63, "r_x3": 151.52, "r_y3": 602.63, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 12, "label": "list_item", "bbox": { "l": 134.76, "t": 612.95, "r": 480.6, "b": 631.98, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 621.02, "r_x1": 146.62, "r_y1": 621.02, "r_x2": 146.62, "r_y2": 612.95, "r_x3": 134.76, "r_y3": 612.95, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.26, "r_y0": 621.02, "r_x1": 480.6, "r_y1": 621.02, "r_x2": 480.6, "r_y2": 612.95, "r_x3": 151.26, "r_y3": 612.95, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 631.98, "r_x1": 234.43, "r_y1": 631.98, "r_x2": 234.43, "r_y2": 623.91, "r_x3": 151.52, "r_y3": 623.91, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 8, "label": "list_item", "bbox": { "l": 134.76, "t": 634.88, "r": 480.59, "b": 664.87, "coord_origin": "TOPLEFT" }, "confidence": 0.965, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 642.95, "r_x1": 146.31, "r_y1": 642.95, "r_x2": 146.31, "r_y2": 634.88, "r_x3": 134.76, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.82, "r_y0": 642.95, "r_x1": 480.59, "r_y1": 642.95, "r_x2": 480.59, "r_y2": 634.88, "r_x3": 150.82, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 653.91, "r_x1": 480.59, "r_y1": 653.91, "r_x2": 480.59, "r_y2": 645.84, "r_x3": 151.52, "r_y3": 645.84, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 664.87, "r_x1": 299.3, "r_y1": 664.87, "r_x2": 299.3, "r_y2": 656.8, "r_x3": 151.52, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 471.38, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.906, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.38, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 471.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" }, { "label": "list_item", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.37, "t": 119.67, "r": 480.59, "b": 149.66, "coord_origin": "TOPLEFT" }, "confidence": 0.968, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 127.74, "r_x1": 146.05, "r_y1": 127.74, "r_x2": 146.05, "r_y2": 119.67, "r_x3": 139.37, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.34, "r_y0": 127.74, "r_x1": 480.59, "r_y1": 127.74, "r_x2": 480.59, "r_y2": 119.67, "r_x3": 150.34, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 138.7, "r_x1": 480.59, "r_y1": 138.7, "r_x2": 480.59, "r_y2": 130.63, "r_x3": 151.52, "r_y3": 130.63, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 149.66, "r_x1": 304.04, "r_y1": 149.66, "r_x2": 304.04, "r_y2": 141.59, "r_x3": 151.52, "r_y3": 141.59, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content extraction from scientific tables. International Journal on Document Analysis and Recognition (IJDAR) pp. 1-10 (2022)" }, { "label": "list_item", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 139.37, "t": 152.56, "r": 480.59, "b": 193.51, "coord_origin": "TOPLEFT" }, "confidence": 0.973, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 160.63, "r_x1": 145.94, "r_y1": 160.63, "r_x2": 145.94, "r_y2": 152.56, "r_x3": 139.37, "r_y3": 152.56, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16, "r_y0": 160.63, "r_x1": 480.59, "r_y1": 160.63, "r_x2": 480.59, "r_y2": 152.56, "r_x3": 150.16, "r_y3": 152.56, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 171.59, "r_x1": 480.59, "r_y1": 171.59, "r_x2": 480.59, "r_y2": 163.52, "r_x3": 151.52, "r_y3": 163.52, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 182.55, "r_x1": 480.59, "r_y1": 182.55, "r_x2": 480.59, "r_y2": 174.48, "r_x3": 151.52, "r_y3": 174.48, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 193.51, "r_x1": 226.37, "r_y1": 193.51, "r_x2": 226.37, "r_y2": 185.44, "r_x3": 151.52, "r_y3": 185.44, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC). pp. 18681873. IEEE (2022)" }, { "label": "list_item", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 139.37, "t": 196.41, "r": 480.59, "b": 215.44, "coord_origin": "TOPLEFT" }, "confidence": 0.958, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 204.48, "r_x1": 146.31, "r_y1": 204.48, "r_x2": 146.31, "r_y2": 196.41, "r_x3": 139.37, "r_y3": 196.41, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.78, "r_y0": 204.48, "r_x1": 480.59, "r_y1": 204.48, "r_x2": 480.59, "r_y2": 196.41, "r_x3": 150.78, "r_y3": 196.41, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 215.44, "r_x1": 352.02, "r_y1": 215.44, "r_x2": 352.02, "r_y2": 207.37, "r_x3": 151.52, "r_y3": 207.37, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark dataset for table detection and recognition (2019)" }, { "label": "list_item", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.37, "t": 218.34, "r": 480.59, "b": 270.29, "coord_origin": "TOPLEFT" }, "confidence": 0.968, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 226.41, "r_x1": 146.37, "r_y1": 226.41, "r_x2": 146.37, "r_y2": 218.34, "r_x3": 139.37, "r_y3": 218.34, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.87, "r_y0": 226.41, "r_x1": 480.59, "r_y1": 226.41, "r_x2": 480.59, "r_y2": 218.34, "r_x3": 150.87, "r_y3": 218.34, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 237.37, "r_x1": 480.59, "r_y1": 237.37, "r_x2": 480.59, "r_y2": 229.3, "r_x3": 151.52, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 248.33, "r_x1": 480.59, "r_y1": 248.33, "r_x2": 480.59, "r_y2": 240.26, "r_x3": 151.52, "r_y3": 240.26, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 259.29, "r_x1": 197.09, "r_y1": 259.29, "r_x2": 197.09, "r_y2": 251.22, "r_x3": 151.52, "r_y3": 251.22, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.4, "r_y0": 259.08, "r_x1": 210.01, "r_y1": 259.08, "r_x2": 210.01, "r_y2": 251.15, "r_x3": 199.4, "r_y3": 251.15, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.01, "r_y0": 259.29, "r_x1": 332.38, "r_y1": 259.29, "r_x2": 332.38, "r_y2": 251.22, "r_x3": 210.01, "r_y3": 251.22, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.7, "r_y0": 259.33, "r_x1": 480.59, "r_y1": 259.33, "r_x2": 480.59, "r_y2": 251.86, "r_x3": 334.7, "r_y3": 251.86, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 270.29, "r_x1": 259.76, "r_y1": 270.29, "r_x2": 259.76, "r_y2": 262.82, "r_x3": 151.52, "r_y3": 262.82, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho, A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence 35 (17), 15137-15145 (May 2021), https://ojs.aaai.org/index.php/ AAAI/article/view/17777" }, { "label": "list_item", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 139.37, "t": 273.14, "r": 480.59, "b": 303.13, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 281.21, "r_x1": 146.14, "r_y1": 281.21, "r_x2": 146.14, "r_y2": 273.14, "r_x3": 139.37, "r_y3": 273.14, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 281.21, "r_x1": 480.59, "r_y1": 281.21, "r_x2": 480.59, "r_y2": 273.14, "r_x3": 150.5, "r_y3": 273.14, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 292.17, "r_x1": 480.59, "r_y1": 292.17, "r_x2": 480.59, "r_y2": 284.1, "r_x3": 151.52, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 303.13, "r_x1": 473.44, "r_y1": 303.13, "r_x2": 473.44, "r_y2": 295.06, "r_x3": 151.52, "r_y3": 295.06, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure understanding with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)" }, { "label": "list_item", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 134.76, "t": 306.03, "r": 480.59, "b": 368.94, "coord_origin": "TOPLEFT" }, "confidence": 0.964, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 314.1, "r_x1": 146.5, "r_y1": 314.1, "r_x2": 146.5, "r_y2": 306.03, "r_x3": 134.76, "r_y3": 306.03, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.09, "r_y0": 314.1, "r_x1": 480.59, "r_y1": 314.1, "r_x2": 480.59, "r_y2": 306.03, "r_x3": 151.09, "r_y3": 306.03, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 325.06, "r_x1": 480.59, "r_y1": 325.06, "r_x2": 480.59, "r_y2": 316.99, "r_x3": 151.52, "r_y3": 316.99, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 336.02, "r_x1": 480.59, "r_y1": 336.02, "r_x2": 480.59, "r_y2": 327.95, "r_x3": 151.52, "r_y3": 327.95, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 346.98, "r_x1": 480.59, "r_y1": 346.98, "r_x2": 480.59, "r_y2": 338.91, "r_x3": 151.52, "r_y3": 338.91, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 357.94, "r_x1": 251.14, "r_y1": 357.94, "r_x2": 251.14, "r_y2": 349.87, "r_x3": 151.52, "r_y3": 349.87, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.99, "r_y0": 357.98, "r_x1": 437.53, "r_y1": 357.98, "r_x2": 437.53, "r_y2": 350.51, "r_x3": 253.99, "r_y3": 350.51, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.53, "r_y0": 357.94, "r_x1": 440.09, "r_y1": 357.94, "r_x2": 440.09, "r_y2": 349.87, "r_x3": 437.53, "r_y3": 349.87, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94, "r_y0": 357.98, "r_x1": 480.59, "r_y1": 357.98, "r_x2": 480.59, "r_y2": 350.51, "r_x3": 442.94, "r_y3": 350.51, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 368.94, "r_x1": 297.41, "r_y1": 368.94, "r_x2": 297.41, "r_y2": 361.47, "r_x3": 151.52, "r_y3": 361.47, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10. Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A large human-annotated dataset for document-layout segmentation. In: Zhang, A., Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp. 3743-3751. ACM (2022). https://doi.org/10.1145/3534678.3539043 , https:// doi.org/10.1145/3534678.3539043" }, { "label": "list_item", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.76, "t": 371.8, "r": 480.59, "b": 412.74, "coord_origin": "TOPLEFT" }, "confidence": 0.975, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.87, "r_x1": 146.04, "r_y1": 379.87, "r_x2": 146.04, "r_y2": 371.8, "r_x3": 134.76, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.45, "r_y0": 379.87, "r_x1": 480.59, "r_y1": 379.87, "r_x2": 480.59, "r_y2": 371.8, "r_x3": 150.45, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 390.83, "r_x1": 480.59, "r_y1": 390.83, "r_x2": 480.59, "r_y2": 382.76, "r_x3": 151.52, "r_y3": 382.76, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 401.79, "r_x1": 480.59, "r_y1": 401.79, "r_x2": 480.59, "r_y2": 393.72, "r_x3": 151.52, "r_y3": 393.72, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 412.74, "r_x1": 373.83, "r_y1": 412.74, "r_x2": 373.83, "r_y2": 404.67, "r_x3": 151.52, "r_y3": 404.67, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11. Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet: An approach for end to end table detection and structure recognition from imagebased documents. In: Proceedings of the IEEE/CVF conference on computer vision and pattern recognition workshops. pp. 572-573 (2020)" }, { "label": "list_item", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.76, "t": 415.64, "r": 480.59, "b": 456.59, "coord_origin": "TOPLEFT" }, "confidence": 0.971, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 423.71, "r_x1": 145.91, "r_y1": 423.71, "r_x2": 145.91, "r_y2": 415.64, "r_x3": 134.76, "r_y3": 415.64, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.27, "r_y0": 423.71, "r_x1": 480.59, "r_y1": 423.71, "r_x2": 480.59, "r_y2": 415.64, "r_x3": 150.27, "r_y3": 415.64, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 434.67, "r_x1": 480.59, "r_y1": 434.67, "r_x2": 480.59, "r_y2": 426.6, "r_x3": 151.52, "r_y3": 426.6, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 445.63, "r_x1": 480.59, "r_y1": 445.63, "r_x2": 480.59, "r_y2": 437.56, "r_x3": 151.52, "r_y3": 437.56, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 456.59, "r_x1": 292.91, "r_y1": 456.59, "r_x2": 292.91, "r_y2": 448.52, "r_x3": 151.52, "r_y3": 448.52, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12. Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR). vol. 1, pp. 1162-1167. IEEE (2017)" }, { "label": "list_item", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 134.76, "t": 459.49, "r": 480.59, "b": 500.48, "coord_origin": "TOPLEFT" }, "confidence": 0.966, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 467.56, "r_x1": 145.78, "r_y1": 467.56, "r_x2": 145.78, "r_y2": 459.49, "r_x3": 134.76, "r_y3": 459.49, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.09, "r_y0": 467.56, "r_x1": 480.59, "r_y1": 467.56, "r_x2": 480.59, "r_y2": 459.49, "r_x3": 150.09, "r_y3": 459.49, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 478.52, "r_x1": 480.59, "r_y1": 478.52, "r_x2": 480.59, "r_y2": 470.45, "r_x3": 151.52, "r_y3": 470.45, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 489.48, "r_x1": 439.06, "r_y1": 489.48, "r_x2": 439.06, "r_y2": 481.41, "r_x3": 151.52, "r_y3": 481.41, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94, "r_y0": 489.52, "r_x1": 480.59, "r_y1": 489.52, "r_x2": 480.59, "r_y2": 482.06, "r_x3": 442.94, "r_y3": 482.06, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 500.48, "r_x1": 302.12, "r_y1": 500.48, "r_x2": 302.12, "r_y2": 493.01, "r_x3": 151.52, "r_y3": 493.01, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13. Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep learning based table structure recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019). https:// doi.org/10.1109/ICDAR.2019.00226" }, { "label": "list_item", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.76, "t": 503.34, "r": 480.59, "b": 544.29, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 511.41, "r_x1": 146.16, "r_y1": 511.41, "r_x2": 146.16, "r_y2": 503.34, "r_x3": 134.76, "r_y3": 503.34, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.61, "r_y0": 511.41, "r_x1": 480.59, "r_y1": 511.41, "r_x2": 480.59, "r_y2": 503.34, "r_x3": 150.61, "r_y3": 503.34, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 522.37, "r_x1": 480.59, "r_y1": 522.37, "r_x2": 480.59, "r_y2": 514.3, "r_x3": 151.52, "r_y3": 514.3, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 533.33, "r_x1": 480.59, "r_y1": 533.33, "r_x2": 480.59, "r_y2": 525.26, "r_x3": 151.52, "r_y3": 525.26, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 544.29, "r_x1": 199.25, "r_y1": 544.29, "r_x2": 199.25, "r_y2": 536.22, "r_x3": 151.52, "r_y3": 536.22, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14. Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive table extraction from unstructured documents. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642 (June 2022)" }, { "label": "list_item", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 134.76, "t": 547.19, "r": 480.6, "b": 610.1, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 555.26, "r_x1": 146.17, "r_y1": 555.26, "r_x2": 146.17, "r_y2": 547.19, "r_x3": 134.76, "r_y3": 547.19, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.63, "r_y0": 555.26, "r_x1": 480.59, "r_y1": 555.26, "r_x2": 480.59, "r_y2": 547.19, "r_x3": 150.63, "r_y3": 547.19, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 566.21, "r_x1": 480.59, "r_y1": 566.21, "r_x2": 480.59, "r_y2": 558.14, "r_x3": 151.52, "r_y3": 558.14, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 577.17, "r_x1": 480.59, "r_y1": 577.17, "r_x2": 480.59, "r_y2": 569.1, "r_x3": 151.52, "r_y3": 569.1, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 588.13, "r_x1": 480.59, "r_y1": 588.13, "r_x2": 480.59, "r_y2": 580.06, "r_x3": 151.52, "r_y3": 580.06, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 599.09, "r_x1": 200.76, "r_y1": 599.09, "r_x2": 200.76, "r_y2": 591.02, "r_x3": 151.52, "r_y3": 591.02, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.92, "r_y0": 599.14, "r_x1": 386.46, "r_y1": 599.14, "r_x2": 386.46, "r_y2": 591.67, "r_x3": 202.92, "r_y3": 591.67, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.46, "r_y0": 599.09, "r_x1": 389.02, "r_y1": 599.09, "r_x2": 389.02, "r_y2": 591.02, "r_x3": 386.46, "r_y3": 591.02, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.17, "r_y0": 599.14, "r_x1": 480.6, "r_y1": 599.14, "r_x2": 480.6, "r_y2": 591.67, "r_x3": 391.17, "r_y3": 591.67, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 610.1, "r_x1": 245.64, "r_y1": 610.1, "r_x2": 245.64, "r_y2": 602.63, "r_x3": 151.52, "r_y3": 602.63, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15. Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A machine learning platform to ingest documents at scale. In: Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY, USA (2018). https://doi.org/10.1145/3219819.3219834 , https://doi.org/10. 1145/3219819.3219834" }, { "label": "list_item", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 134.76, "t": 612.95, "r": 480.6, "b": 631.98, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 621.02, "r_x1": 146.62, "r_y1": 621.02, "r_x2": 146.62, "r_y2": 612.95, "r_x3": 134.76, "r_y3": 612.95, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.26, "r_y0": 621.02, "r_x1": 480.6, "r_y1": 621.02, "r_x2": 480.6, "r_y2": 612.95, "r_x3": 151.26, "r_y3": 612.95, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 631.98, "r_x1": 234.43, "r_y1": 631.98, "r_x2": 234.43, "r_y2": 623.91, "r_x3": 151.52, "r_y3": 623.91, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16. Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN (1996), aAINN09397" }, { "label": "list_item", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 134.76, "t": 634.88, "r": 480.59, "b": 664.87, "coord_origin": "TOPLEFT" }, "confidence": 0.965, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 642.95, "r_x1": 146.31, "r_y1": 642.95, "r_x2": 146.31, "r_y2": 634.88, "r_x3": 134.76, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.82, "r_y0": 642.95, "r_x1": 480.59, "r_y1": 642.95, "r_x2": 480.59, "r_y2": 634.88, "r_x3": 150.82, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 653.91, "r_x1": 480.59, "r_y1": 653.91, "r_x2": 480.59, "r_y2": 645.84, "r_x3": 151.52, "r_y3": 645.84, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 664.87, "r_x1": 299.3, "r_y1": 664.87, "r_x2": 299.3, "r_y2": 656.8, "r_x3": 151.52, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "17. Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table images. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 749-755. IEEE (2019)" } ], "body": [ { "label": "list_item", "id": 5, "page_no": 12, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 139.37, "t": 119.67, "r": 480.59, "b": 149.66, "coord_origin": "TOPLEFT" }, "confidence": 0.968, "cells": [ { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 127.74, "r_x1": 146.05, "r_y1": 127.74, "r_x2": 146.05, "r_y2": 119.67, "r_x3": 139.37, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.34, "r_y0": 127.74, "r_x1": 480.59, "r_y1": 127.74, "r_x2": 480.59, "r_y2": 119.67, "r_x3": 150.34, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "orig": "Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 138.7, "r_x1": 480.59, "r_y1": 138.7, "r_x2": 480.59, "r_y2": 130.63, "r_x3": 151.52, "r_y3": 130.63, "coord_origin": "TOPLEFT" }, "text": "extraction from scientific tables. International Journal on Document Analysis and", "orig": "extraction from scientific tables. International Journal on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 149.66, "r_x1": 304.04, "r_y1": 149.66, "r_x2": 304.04, "r_y2": 141.59, "r_x3": 151.52, "r_y3": 141.59, "coord_origin": "TOPLEFT" }, "text": "Recognition (IJDAR) pp. 1-10 (2022)", "orig": "Recognition (IJDAR) pp. 1-10 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "5. Kayal, P., Anand, M., Desai, H., Singh, M.: Tables to latex: structure and content extraction from scientific tables. International Journal on Document Analysis and Recognition (IJDAR) pp. 1-10 (2022)" }, { "label": "list_item", "id": 1, "page_no": 12, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 139.37, "t": 152.56, "r": 480.59, "b": 193.51, "coord_origin": "TOPLEFT" }, "confidence": 0.973, "cells": [ { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 160.63, "r_x1": 145.94, "r_y1": 160.63, "r_x2": 145.94, "r_y2": 152.56, "r_x3": 139.37, "r_y3": 152.56, "coord_origin": "TOPLEFT" }, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.16, "r_y0": 160.63, "r_x1": 480.59, "r_y1": 160.63, "r_x2": 480.59, "r_y2": 152.56, "r_x3": 150.16, "r_y3": 152.56, "coord_origin": "TOPLEFT" }, "text": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "orig": "Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 171.59, "r_x1": 480.59, "r_y1": 171.59, "r_x2": 480.59, "r_y2": 163.52, "r_x3": 151.52, "r_y3": 163.52, "coord_origin": "TOPLEFT" }, "text": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "orig": "recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 182.55, "r_x1": 480.59, "r_y1": 182.55, "r_x2": 480.59, "r_y2": 174.48, "r_x3": 151.52, "r_y3": 174.48, "coord_origin": "TOPLEFT" }, "text": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "orig": "Processing Association Annual Summit and Conference (APSIPA ASC). pp. 1868-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 193.51, "r_x1": 226.37, "r_y1": 193.51, "r_x2": 226.37, "r_y2": 185.44, "r_x3": 151.52, "r_y3": 185.44, "coord_origin": "TOPLEFT" }, "text": "1873. IEEE (2022)", "orig": "1873. IEEE (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "6. Lee, E., Kwon, J., Yang, H., Park, J., Lee, S., Koo, H.I., Cho, N.I.: Table structure recognition based on grid shape graph. In: 2022 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC). pp. 18681873. IEEE (2022)" }, { "label": "list_item", "id": 10, "page_no": 12, "cluster": { "id": 10, "label": "list_item", "bbox": { "l": 139.37, "t": 196.41, "r": 480.59, "b": 215.44, "coord_origin": "TOPLEFT" }, "confidence": 0.958, "cells": [ { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 204.48, "r_x1": 146.31, "r_y1": 204.48, "r_x2": 146.31, "r_y2": 196.41, "r_x3": 139.37, "r_y3": 196.41, "coord_origin": "TOPLEFT" }, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.78, "r_y0": 204.48, "r_x1": 480.59, "r_y1": 204.48, "r_x2": 480.59, "r_y2": 196.41, "r_x3": 150.78, "r_y3": 196.41, "coord_origin": "TOPLEFT" }, "text": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "orig": "Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 215.44, "r_x1": 352.02, "r_y1": 215.44, "r_x2": 352.02, "r_y2": 207.37, "r_x3": 151.52, "r_y3": 207.37, "coord_origin": "TOPLEFT" }, "text": "dataset for table detection and recognition (2019)", "orig": "dataset for table detection and recognition (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "7. Li, M., Cui, L., Huang, S., Wei, F., Zhou, M., Li, Z.: Tablebank: A benchmark dataset for table detection and recognition (2019)" }, { "label": "list_item", "id": 4, "page_no": 12, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 139.37, "t": 218.34, "r": 480.59, "b": 270.29, "coord_origin": "TOPLEFT" }, "confidence": 0.968, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 226.41, "r_x1": 146.37, "r_y1": 226.41, "r_x2": 146.37, "r_y2": 218.34, "r_x3": 139.37, "r_y3": 218.34, "coord_origin": "TOPLEFT" }, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.87, "r_y0": 226.41, "r_x1": 480.59, "r_y1": 226.41, "r_x2": 480.59, "r_y2": 218.34, "r_x3": 150.87, "r_y3": 218.34, "coord_origin": "TOPLEFT" }, "text": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "orig": "Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 237.37, "r_x1": 480.59, "r_y1": 237.37, "r_x2": 480.59, "r_y2": 229.3, "r_x3": 151.52, "r_y3": 229.3, "coord_origin": "TOPLEFT" }, "text": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "orig": "A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 248.33, "r_x1": 480.59, "r_y1": 248.33, "r_x2": 480.59, "r_y2": 240.26, "r_x3": 151.52, "r_y3": 240.26, "coord_origin": "TOPLEFT" }, "text": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "orig": "using recurrent neural networks. Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 259.29, "r_x1": 197.09, "r_y1": 259.29, "r_x2": 197.09, "r_y2": 251.22, "r_x3": 151.52, "r_y3": 251.22, "coord_origin": "TOPLEFT" }, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 199.4, "r_y0": 259.08, "r_x1": 210.01, "r_y1": 259.08, "r_x2": 210.01, "r_y2": 251.15, "r_x3": 199.4, "r_y3": 251.15, "coord_origin": "TOPLEFT" }, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 210.01, "r_y0": 259.29, "r_x1": 332.38, "r_y1": 259.29, "r_x2": 332.38, "r_y2": 251.22, "r_x3": 210.01, "r_y3": 251.22, "coord_origin": "TOPLEFT" }, "text": "(17), 15137-15145 (May 2021),", "orig": "(17), 15137-15145 (May 2021),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 334.7, "r_y0": 259.33, "r_x1": 480.59, "r_y1": 259.33, "r_x2": 480.59, "r_y2": 251.86, "r_x3": 334.7, "r_y3": 251.86, "coord_origin": "TOPLEFT" }, "text": "https://ojs.aaai.org/index.php/", "orig": "https://ojs.aaai.org/index.php/", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 270.29, "r_x1": 259.76, "r_y1": 270.29, "r_x2": 259.76, "r_y2": 262.82, "r_x3": 151.52, "r_y3": 262.82, "coord_origin": "TOPLEFT" }, "text": "AAAI/article/view/17777", "orig": "AAAI/article/view/17777", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "8. Livathinos, N., Berrospi, C., Lysak, M., Kuropiatnyk, V., Nassar, A., Carvalho, A., Dolfi, M., Auer, C., Dinkla, K., Staar, P.: Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence 35 (17), 15137-15145 (May 2021), https://ojs.aaai.org/index.php/ AAAI/article/view/17777" }, { "label": "list_item", "id": 11, "page_no": 12, "cluster": { "id": 11, "label": "list_item", "bbox": { "l": 139.37, "t": 273.14, "r": 480.59, "b": 303.13, "coord_origin": "TOPLEFT" }, "confidence": 0.956, "cells": [ { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 139.37, "r_y0": 281.21, "r_x1": 146.14, "r_y1": 281.21, "r_x2": 146.14, "r_y2": 273.14, "r_x3": 139.37, "r_y3": 273.14, "coord_origin": "TOPLEFT" }, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.5, "r_y0": 281.21, "r_x1": 480.59, "r_y1": 281.21, "r_x2": 480.59, "r_y2": 273.14, "r_x3": 150.5, "r_y3": 273.14, "coord_origin": "TOPLEFT" }, "text": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "orig": "Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure un-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 292.17, "r_x1": 480.59, "r_y1": 292.17, "r_x2": 480.59, "r_y2": 284.1, "r_x3": 151.52, "r_y3": 284.1, "coord_origin": "TOPLEFT" }, "text": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "orig": "derstanding with transformers. In: Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 303.13, "r_x1": 473.44, "r_y1": 303.13, "r_x2": 473.44, "r_y2": 295.06, "r_x3": 151.52, "r_y3": 295.06, "coord_origin": "TOPLEFT" }, "text": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "orig": "Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "9. Nassar, A., Livathinos, N., Lysak, M., Staar, P.: Tableformer: Table structure understanding with transformers. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4614-4623 (June 2022)" }, { "label": "list_item", "id": 9, "page_no": 12, "cluster": { "id": 9, "label": "list_item", "bbox": { "l": 134.76, "t": 306.03, "r": 480.59, "b": 368.94, "coord_origin": "TOPLEFT" }, "confidence": 0.964, "cells": [ { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 314.1, "r_x1": 146.5, "r_y1": 314.1, "r_x2": 146.5, "r_y2": 306.03, "r_x3": 134.76, "r_y3": 306.03, "coord_origin": "TOPLEFT" }, "text": "10.", "orig": "10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.09, "r_y0": 314.1, "r_x1": 480.59, "r_y1": 314.1, "r_x2": 480.59, "r_y2": 306.03, "r_x3": 151.09, "r_y3": 306.03, "coord_origin": "TOPLEFT" }, "text": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "orig": "Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 325.06, "r_x1": 480.59, "r_y1": 325.06, "r_x2": 480.59, "r_y2": 316.99, "r_x3": 151.52, "r_y3": 316.99, "coord_origin": "TOPLEFT" }, "text": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "orig": "large human-annotated dataset for document-layout segmentation. In: Zhang, A.,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 336.02, "r_x1": 480.59, "r_y1": 336.02, "r_x2": 480.59, "r_y2": 327.95, "r_x3": 151.52, "r_y3": 327.95, "coord_origin": "TOPLEFT" }, "text": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "orig": "Rangwala, H. (eds.) KDD \u201922: The 28th ACM SIGKDD Conference on Knowledge", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 346.98, "r_x1": 480.59, "r_y1": 346.98, "r_x2": 480.59, "r_y2": 338.91, "r_x3": 151.52, "r_y3": 338.91, "coord_origin": "TOPLEFT" }, "text": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "orig": "Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 357.94, "r_x1": 251.14, "r_y1": 357.94, "r_x2": 251.14, "r_y2": 349.87, "r_x3": 151.52, "r_y3": 349.87, "coord_origin": "TOPLEFT" }, "text": "3743-3751. ACM (2022).", "orig": "3743-3751. ACM (2022).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 253.99, "r_y0": 357.98, "r_x1": 437.53, "r_y1": 357.98, "r_x2": 437.53, "r_y2": 350.51, "r_x3": 253.99, "r_y3": 350.51, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3534678.3539043", "orig": "https://doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 437.53, "r_y0": 357.94, "r_x1": 440.09, "r_y1": 357.94, "r_x2": 440.09, "r_y2": 349.87, "r_x3": 437.53, "r_y3": 349.87, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 35, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94, "r_y0": 357.98, "r_x1": 480.59, "r_y1": 357.98, "r_x2": 480.59, "r_y2": 350.51, "r_x3": 442.94, "r_y3": 350.51, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 36, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 368.94, "r_x1": 297.41, "r_y1": 368.94, "r_x2": 297.41, "r_y2": 361.47, "r_x3": 151.52, "r_y3": 361.47, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1145/3534678.3539043", "orig": "doi.org/10.1145/3534678.3539043", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "10. Pfitzmann, B., Auer, C., Dolfi, M., Nassar, A.S., Staar, P.W.J.: Doclaynet: A large human-annotated dataset for document-layout segmentation. In: Zhang, A., Rangwala, H. (eds.) KDD '22: The 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, Washington, DC, USA, August 14 - 18, 2022. pp. 3743-3751. ACM (2022). https://doi.org/10.1145/3534678.3539043 , https:// doi.org/10.1145/3534678.3539043" }, { "label": "list_item", "id": 0, "page_no": 12, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.76, "t": 371.8, "r": 480.59, "b": 412.74, "coord_origin": "TOPLEFT" }, "confidence": 0.975, "cells": [ { "index": 37, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 379.87, "r_x1": 146.04, "r_y1": 379.87, "r_x2": 146.04, "r_y2": 371.8, "r_x3": 134.76, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "11.", "orig": "11.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 38, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.45, "r_y0": 379.87, "r_x1": 480.59, "r_y1": 379.87, "r_x2": 480.59, "r_y2": 371.8, "r_x3": 150.45, "r_y3": 371.8, "coord_origin": "TOPLEFT" }, "text": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "orig": "Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 39, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 390.83, "r_x1": 480.59, "r_y1": 390.83, "r_x2": 480.59, "r_y2": 382.76, "r_x3": 151.52, "r_y3": 382.76, "coord_origin": "TOPLEFT" }, "text": "An approach for end to end table detection and structure recognition from image-", "orig": "An approach for end to end table detection and structure recognition from image-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 40, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 401.79, "r_x1": 480.59, "r_y1": 401.79, "r_x2": 480.59, "r_y2": 393.72, "r_x3": 151.52, "r_y3": 393.72, "coord_origin": "TOPLEFT" }, "text": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "orig": "based documents. In: Proceedings of the IEEE/CVF conference on computer vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 41, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 412.74, "r_x1": 373.83, "r_y1": 412.74, "r_x2": 373.83, "r_y2": 404.67, "r_x3": 151.52, "r_y3": 404.67, "coord_origin": "TOPLEFT" }, "text": "and pattern recognition workshops. pp. 572-573 (2020)", "orig": "and pattern recognition workshops. pp. 572-573 (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "11. Prasad, D., Gadpal, A., Kapadni, K., Visave, M., Sultanpure, K.: Cascadetabnet: An approach for end to end table detection and structure recognition from imagebased documents. In: Proceedings of the IEEE/CVF conference on computer vision and pattern recognition workshops. pp. 572-573 (2020)" }, { "label": "list_item", "id": 3, "page_no": 12, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.76, "t": 415.64, "r": 480.59, "b": 456.59, "coord_origin": "TOPLEFT" }, "confidence": 0.971, "cells": [ { "index": 42, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 423.71, "r_x1": 145.91, "r_y1": 423.71, "r_x2": 145.91, "r_y2": 415.64, "r_x3": 134.76, "r_y3": 415.64, "coord_origin": "TOPLEFT" }, "text": "12.", "orig": "12.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 43, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.27, "r_y0": 423.71, "r_x1": 480.59, "r_y1": 423.71, "r_x2": 480.59, "r_y2": 415.64, "r_x3": 150.27, "r_y3": 415.64, "coord_origin": "TOPLEFT" }, "text": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "orig": "Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 44, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 434.67, "r_x1": 480.59, "r_y1": 434.67, "r_x2": 480.59, "r_y2": 426.6, "r_x3": 151.52, "r_y3": 426.6, "coord_origin": "TOPLEFT" }, "text": "for detection and structure recognition of tables in document images. In: 2017 14th", "orig": "for detection and structure recognition of tables in document images. In: 2017 14th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 45, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 445.63, "r_x1": 480.59, "r_y1": 445.63, "r_x2": 480.59, "r_y2": 437.56, "r_x3": 151.52, "r_y3": 437.56, "coord_origin": "TOPLEFT" }, "text": "IAPR international conference on document analysis and recognition (ICDAR).", "orig": "IAPR international conference on document analysis and recognition (ICDAR).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 46, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 456.59, "r_x1": 292.91, "r_y1": 456.59, "r_x2": 292.91, "r_y2": 448.52, "r_x3": 151.52, "r_y3": 448.52, "coord_origin": "TOPLEFT" }, "text": "vol. 1, pp. 1162-1167. IEEE (2017)", "orig": "vol. 1, pp. 1162-1167. IEEE (2017)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "12. Schreiber, S., Agne, S., Wolf, I., Dengel, A., Ahmed, S.: Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In: 2017 14th IAPR international conference on document analysis and recognition (ICDAR). vol. 1, pp. 1162-1167. IEEE (2017)" }, { "label": "list_item", "id": 7, "page_no": 12, "cluster": { "id": 7, "label": "list_item", "bbox": { "l": 134.76, "t": 459.49, "r": 480.59, "b": 500.48, "coord_origin": "TOPLEFT" }, "confidence": 0.966, "cells": [ { "index": 47, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 467.56, "r_x1": 145.78, "r_y1": 467.56, "r_x2": 145.78, "r_y2": 459.49, "r_x3": 134.76, "r_y3": 459.49, "coord_origin": "TOPLEFT" }, "text": "13.", "orig": "13.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 48, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.09, "r_y0": 467.56, "r_x1": 480.59, "r_y1": 467.56, "r_x2": 480.59, "r_y2": 459.49, "r_x3": 150.09, "r_y3": 459.49, "coord_origin": "TOPLEFT" }, "text": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "orig": "Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 49, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 478.52, "r_x1": 480.59, "r_y1": 478.52, "r_x2": 480.59, "r_y2": 470.45, "r_x3": 151.52, "r_y3": 470.45, "coord_origin": "TOPLEFT" }, "text": "learning based table structure recognition. In: 2019 International Conference on", "orig": "learning based table structure recognition. In: 2019 International Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 50, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 489.48, "r_x1": 439.06, "r_y1": 489.48, "r_x2": 439.06, "r_y2": 481.41, "r_x3": 151.52, "r_y3": 481.41, "coord_origin": "TOPLEFT" }, "text": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "orig": "Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 51, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 442.94, "r_y0": 489.52, "r_x1": 480.59, "r_y1": 489.52, "r_x2": 480.59, "r_y2": 482.06, "r_x3": 442.94, "r_y3": 482.06, "coord_origin": "TOPLEFT" }, "text": "https://", "orig": "https://", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 52, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 500.48, "r_x1": 302.12, "r_y1": 500.48, "r_x2": 302.12, "r_y2": 493.01, "r_x3": 151.52, "r_y3": 493.01, "coord_origin": "TOPLEFT" }, "text": "doi.org/10.1109/ICDAR.2019.00226", "orig": "doi.org/10.1109/ICDAR.2019.00226", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13. Siddiqui, S.A., Fateh, I.A., Rizvi, S.T.R., Dengel, A., Ahmed, S.: Deeptabstr: Deep learning based table structure recognition. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1403-1409 (2019). https:// doi.org/10.1109/ICDAR.2019.00226" }, { "label": "list_item", "id": 2, "page_no": 12, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.76, "t": 503.34, "r": 480.59, "b": 544.29, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 53, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 511.41, "r_x1": 146.16, "r_y1": 511.41, "r_x2": 146.16, "r_y2": 503.34, "r_x3": 134.76, "r_y3": 503.34, "coord_origin": "TOPLEFT" }, "text": "14.", "orig": "14.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 54, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.61, "r_y0": 511.41, "r_x1": 480.59, "r_y1": 511.41, "r_x2": 480.59, "r_y2": 503.34, "r_x3": 150.61, "r_y3": 503.34, "coord_origin": "TOPLEFT" }, "text": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "orig": "Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 55, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 522.37, "r_x1": 480.59, "r_y1": 522.37, "r_x2": 480.59, "r_y2": 514.3, "r_x3": 151.52, "r_y3": 514.3, "coord_origin": "TOPLEFT" }, "text": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "orig": "ble extraction from unstructured documents. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 56, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 533.33, "r_x1": 480.59, "r_y1": 533.33, "r_x2": 480.59, "r_y2": 525.26, "r_x3": 151.52, "r_y3": 525.26, "coord_origin": "TOPLEFT" }, "text": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "orig": "Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 57, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 544.29, "r_x1": 199.25, "r_y1": 544.29, "r_x2": 199.25, "r_y2": 536.22, "r_x3": 151.52, "r_y3": 536.22, "coord_origin": "TOPLEFT" }, "text": "(June 2022)", "orig": "(June 2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14. Smock, B., Pesala, R., Abraham, R.: PubTables-1M: Towards comprehensive table extraction from unstructured documents. In: Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR). pp. 4634-4642 (June 2022)" }, { "label": "list_item", "id": 6, "page_no": 12, "cluster": { "id": 6, "label": "list_item", "bbox": { "l": 134.76, "t": 547.19, "r": 480.6, "b": 610.1, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 58, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 555.26, "r_x1": 146.17, "r_y1": 555.26, "r_x2": 146.17, "r_y2": 547.19, "r_x3": 134.76, "r_y3": 547.19, "coord_origin": "TOPLEFT" }, "text": "15.", "orig": "15.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 59, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.63, "r_y0": 555.26, "r_x1": 480.59, "r_y1": 555.26, "r_x2": 480.59, "r_y2": 547.19, "r_x3": 150.63, "r_y3": 547.19, "coord_origin": "TOPLEFT" }, "text": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "orig": "Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A ma-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 60, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 566.21, "r_x1": 480.59, "r_y1": 566.21, "r_x2": 480.59, "r_y2": 558.14, "r_x3": 151.52, "r_y3": 558.14, "coord_origin": "TOPLEFT" }, "text": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "orig": "chine learning platform to ingest documents at scale. In: Proceedings of the 24th", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 61, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 577.17, "r_x1": 480.59, "r_y1": 577.17, "r_x2": 480.59, "r_y2": 569.1, "r_x3": 151.52, "r_y3": 569.1, "coord_origin": "TOPLEFT" }, "text": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "orig": "ACM SIGKDD International Conference on Knowledge Discovery & Data Min-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 62, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 588.13, "r_x1": 480.59, "r_y1": 588.13, "r_x2": 480.59, "r_y2": 580.06, "r_x3": 151.52, "r_y3": 580.06, "coord_origin": "TOPLEFT" }, "text": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "orig": "ing. pp. 774-782. KDD \u201918, Association for Computing Machinery, New York, NY,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 63, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 599.09, "r_x1": 200.76, "r_y1": 599.09, "r_x2": 200.76, "r_y2": 591.02, "r_x3": 151.52, "r_y3": 591.02, "coord_origin": "TOPLEFT" }, "text": "USA (2018).", "orig": "USA (2018).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 64, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 202.92, "r_y0": 599.14, "r_x1": 386.46, "r_y1": 599.14, "r_x2": 386.46, "r_y2": 591.67, "r_x3": 202.92, "r_y3": 591.67, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1145/3219819.3219834", "orig": "https://doi.org/10.1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 65, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 386.46, "r_y0": 599.09, "r_x1": 389.02, "r_y1": 599.09, "r_x2": 389.02, "r_y2": 591.02, "r_x3": 386.46, "r_y3": 591.02, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 66, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 391.17, "r_y0": 599.14, "r_x1": 480.6, "r_y1": 599.14, "r_x2": 480.6, "r_y2": 591.67, "r_x3": 391.17, "r_y3": 591.67, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.", "orig": "https://doi.org/10.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 67, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 610.1, "r_x1": 245.64, "r_y1": 610.1, "r_x2": 245.64, "r_y2": 602.63, "r_x3": 151.52, "r_y3": 602.63, "coord_origin": "TOPLEFT" }, "text": "1145/3219819.3219834", "orig": "1145/3219819.3219834", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "15. Staar, P.W.J., Dolfi, M., Auer, C., Bekas, C.: Corpus conversion service: A machine learning platform to ingest documents at scale. In: Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. pp. 774-782. KDD '18, Association for Computing Machinery, New York, NY, USA (2018). https://doi.org/10.1145/3219819.3219834 , https://doi.org/10. 1145/3219819.3219834" }, { "label": "list_item", "id": 12, "page_no": 12, "cluster": { "id": 12, "label": "list_item", "bbox": { "l": 134.76, "t": 612.95, "r": 480.6, "b": 631.98, "coord_origin": "TOPLEFT" }, "confidence": 0.942, "cells": [ { "index": 68, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 621.02, "r_x1": 146.62, "r_y1": 621.02, "r_x2": 146.62, "r_y2": 612.95, "r_x3": 134.76, "r_y3": 612.95, "coord_origin": "TOPLEFT" }, "text": "16.", "orig": "16.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 69, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.26, "r_y0": 621.02, "r_x1": 480.6, "r_y1": 621.02, "r_x2": 480.6, "r_y2": 612.95, "r_x3": 151.26, "r_y3": 612.95, "coord_origin": "TOPLEFT" }, "text": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "orig": "Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 70, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 631.98, "r_x1": 234.43, "r_y1": 631.98, "r_x2": 234.43, "r_y2": 623.91, "r_x3": 151.52, "r_y3": 623.91, "coord_origin": "TOPLEFT" }, "text": "(1996), aAINN09397", "orig": "(1996), aAINN09397", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "16. Wang, X.: Tabular Abstraction, Editing, and Formatting. Ph.D. thesis, CAN (1996), aAINN09397" }, { "label": "list_item", "id": 8, "page_no": 12, "cluster": { "id": 8, "label": "list_item", "bbox": { "l": 134.76, "t": 634.88, "r": 480.59, "b": 664.87, "coord_origin": "TOPLEFT" }, "confidence": 0.965, "cells": [ { "index": 71, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 642.95, "r_x1": 146.31, "r_y1": 642.95, "r_x2": 146.31, "r_y2": 634.88, "r_x3": 134.76, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "17.", "orig": "17.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 72, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.82, "r_y0": 642.95, "r_x1": 480.59, "r_y1": 642.95, "r_x2": 480.59, "r_y2": 634.88, "r_x3": 150.82, "r_y3": 634.88, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "orig": "Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 73, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 653.91, "r_x1": 480.59, "r_y1": 653.91, "r_x2": 480.59, "r_y2": 645.84, "r_x3": 151.52, "r_y3": 645.84, "coord_origin": "TOPLEFT" }, "text": "images. In: 2019 International Conference on Document Analysis and Recognition", "orig": "images. In: 2019 International Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 74, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 664.87, "r_x1": 299.3, "r_y1": 664.87, "r_x2": 299.3, "r_y2": 656.8, "r_x3": 151.52, "r_y3": 656.8, "coord_origin": "TOPLEFT" }, "text": "(ICDAR). pp. 749-755. IEEE (2019)", "orig": "(ICDAR). pp. 749-755. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "17. Xue, W., Li, Q., Tao, D.: Res2tim: Reconstruct syntactic structures from table images. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 749-755. IEEE (2019)" } ], "headers": [ { "label": "page_header", "id": 13, "page_no": 12, "cluster": { "id": 13, "label": "page_header", "bbox": { "l": 194.48, "t": 93.77, "r": 447.54, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.916, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 194.48, "r_y0": 101.84, "r_x1": 447.54, "r_y1": 101.84, "r_x2": 447.54, "r_y2": 93.77, "r_x3": 194.48, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Optimized Table Tokenization for Table Structure Recognition", "orig": "Optimized Table Tokenization for Table Structure Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "Optimized Table Tokenization for Table Structure Recognition" }, { "label": "page_header", "id": 14, "page_no": 12, "cluster": { "id": 14, "label": "page_header", "bbox": { "l": 471.38, "t": 93.77, "r": 480.59, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.906, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 471.38, "r_y0": 101.84, "r_x1": 480.59, "r_y1": 101.84, "r_x2": 480.59, "r_y2": 93.77, "r_x3": 471.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "13" } ] } }, { "page_no": 13, "size": { "width": 612.0, "height": 792.0 }, "parsed_page": { "dimension": { "angle": 0.0, "rect": { "r_x0": 0.0, "r_y0": 0.0, "r_x1": 612.0, "r_y1": 0.0, "r_x2": 612.0, "r_y2": 792.0, "r_x3": 0.0, "r_y3": 792.0, "coord_origin": "BOTTOMLEFT" }, "boundary_type": "crop_box", "art_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "bleed_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "crop_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "media_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" }, "trim_bbox": { "l": 0.0, "t": 792.0, "r": 612.0, "b": 0.0, "coord_origin": "BOTTOMLEFT" } }, "bitmap_resources": [], "char_cells": [], "word_cells": [], "textline_cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.74, "r_x1": 146.08, "r_y1": 127.74, "r_x2": 146.08, "r_y2": 119.67, "r_x3": 134.76, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.51, "r_y0": 127.74, "r_x1": 480.59, "r_y1": 127.74, "r_x2": 480.59, "r_y2": 119.67, "r_x3": 150.51, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 138.7, "r_x1": 480.59, "r_y1": 138.7, "r_x2": 480.59, "r_y2": 130.63, "r_x3": 151.52, "r_y3": 130.63, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 149.66, "r_x1": 427.53, "r_y1": 149.66, "r_x2": 427.53, "r_y2": 141.59, "r_x3": 151.52, "r_y3": 141.59, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 160.62, "r_x1": 146.19, "r_y1": 160.62, "r_x2": 146.19, "r_y2": 152.55, "r_x3": 134.76, "r_y3": 152.55, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.66, "r_y0": 160.62, "r_x1": 480.59, "r_y1": 160.62, "r_x2": 480.59, "r_y2": 152.55, "r_x3": 150.66, "r_y3": 152.55, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 171.58, "r_x1": 480.59, "r_y1": 171.58, "r_x2": 480.59, "r_y2": 163.51, "r_x3": 151.52, "r_y3": 163.51, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 182.54, "r_x1": 280.64, "r_y1": 182.54, "r_x2": 280.64, "r_y2": 174.47, "r_x3": 151.52, "r_y3": 174.47, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.08, "r_y0": 182.58, "r_x1": 478.03, "r_y1": 182.58, "r_x2": 478.03, "r_y2": 175.11, "r_x3": 285.08, "r_y3": 175.11, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.03, "r_y0": 182.54, "r_x1": 480.59, "r_y1": 182.54, "r_x2": 480.59, "r_y2": 174.47, "r_x3": 478.03, "r_y3": 174.47, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 193.54, "r_x1": 302.12, "r_y1": 193.54, "r_x2": 302.12, "r_y2": 186.07, "r_x3": 151.52, "r_y3": 186.07, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 204.46, "r_x1": 145.66, "r_y1": 204.46, "r_x2": 145.66, "r_y2": 196.39, "r_x3": 134.76, "r_y3": 196.39, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.92, "r_y0": 204.46, "r_x1": 480.59, "r_y1": 204.46, "r_x2": 480.59, "r_y2": 196.39, "r_x3": 149.92, "r_y3": 196.39, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 215.41, "r_x1": 318.55, "r_y1": 215.41, "r_x2": 318.55, "r_y2": 207.34, "r_x3": 151.52, "r_y3": 207.34, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.62, "r_y0": 215.21, "r_x1": 337.53, "r_y1": 215.21, "r_x2": 337.53, "r_y2": 207.28, "r_x3": 321.62, "r_y3": 207.28, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.53, "r_y0": 215.41, "r_x1": 399.47, "r_y1": 215.41, "r_x2": 399.47, "r_y2": 207.34, "r_x3": 337.53, "r_y3": 207.34, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 226.37, "r_x1": 145.72, "r_y1": 226.37, "r_x2": 145.72, "r_y2": 218.3, "r_x3": 134.76, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.01, "r_y0": 226.37, "r_x1": 480.59, "r_y1": 226.37, "r_x2": 480.59, "r_y2": 218.3, "r_x3": 150.01, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 237.33, "r_x1": 480.59, "r_y1": 237.33, "r_x2": 480.59, "r_y2": 229.26, "r_x3": 151.52, "r_y3": 229.26, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 248.29, "r_x1": 480.59, "r_y1": 248.29, "r_x2": 480.59, "r_y2": 240.22, "r_x3": 151.52, "r_y3": 240.22, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 259.25, "r_x1": 293.44, "r_y1": 259.25, "r_x2": 293.44, "r_y2": 251.18, "r_x3": 151.52, "r_y3": 251.18, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.05, "r_y0": 259.3, "r_x1": 480.59, "r_y1": 259.3, "r_x2": 480.59, "r_y2": 251.83, "r_x3": 297.05, "r_y3": 251.83, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 270.25, "r_x1": 175.05, "r_y1": 270.25, "r_x2": 175.05, "r_y2": 262.79, "r_x3": 151.52, "r_y3": 262.79, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 281.17, "r_x1": 146.37, "r_y1": 281.17, "r_x2": 146.37, "r_y2": 273.1, "r_x3": 134.76, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 281.17, "r_x1": 480.59, "r_y1": 281.17, "r_x2": 480.59, "r_y2": 273.1, "r_x3": 150.91, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 292.13, "r_x1": 480.59, "r_y1": 292.13, "r_x2": 480.59, "r_y2": 284.06, "r_x3": 151.52, "r_y3": 284.06, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 303.09, "r_x1": 480.6, "r_y1": 303.09, "r_x2": 480.6, "r_y2": 295.02, "r_x3": 151.52, "r_y3": 295.02, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 314.05, "r_x1": 236.02, "r_y1": 314.05, "r_x2": 236.02, "r_y2": 305.98, "r_x3": 151.52, "r_y3": 305.98, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 325.0, "r_x1": 145.7, "r_y1": 325.0, "r_x2": 145.7, "r_y2": 316.93, "r_x3": 134.76, "r_y3": 316.93, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.97, "r_y0": 325.0, "r_x1": 480.59, "r_y1": 325.0, "r_x2": 480.59, "r_y2": 316.93, "r_x3": 149.97, "r_y3": 316.93, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 335.96, "r_x1": 480.59, "r_y1": 335.96, "r_x2": 480.59, "r_y2": 327.89, "r_x3": 151.52, "r_y3": 327.89, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 346.92, "r_x1": 335.14, "r_y1": 346.92, "r_x2": 335.14, "r_y2": 338.85, "r_x3": 151.52, "r_y3": 338.85, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "has_chars": false, "has_words": false, "has_lines": true, "image": null, "lines": [] }, "predictions": { "layout": { "clusters": [ { "id": 7, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 143.98, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.701, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 6, "label": "page_header", "bbox": { "l": 167.82, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.789, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 5, "label": "list_item", "bbox": { "l": 134.76, "t": 119.67, "r": 480.59, "b": 149.66, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.74, "r_x1": 146.08, "r_y1": 127.74, "r_x2": 146.08, "r_y2": 119.67, "r_x3": 134.76, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.51, "r_y0": 127.74, "r_x1": 480.59, "r_y1": 127.74, "r_x2": 480.59, "r_y2": 119.67, "r_x3": 150.51, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 138.7, "r_x1": 480.59, "r_y1": 138.7, "r_x2": 480.59, "r_y2": 130.63, "r_x3": 151.52, "r_y3": 130.63, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 149.66, "r_x1": 427.53, "r_y1": 149.66, "r_x2": 427.53, "r_y2": 141.59, "r_x3": 151.52, "r_y3": 141.59, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 3, "label": "list_item", "bbox": { "l": 134.76, "t": 152.55, "r": 480.59, "b": 193.54, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 160.62, "r_x1": 146.19, "r_y1": 160.62, "r_x2": 146.19, "r_y2": 152.55, "r_x3": 134.76, "r_y3": 152.55, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.66, "r_y0": 160.62, "r_x1": 480.59, "r_y1": 160.62, "r_x2": 480.59, "r_y2": 152.55, "r_x3": 150.66, "r_y3": 152.55, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 171.58, "r_x1": 480.59, "r_y1": 171.58, "r_x2": 480.59, "r_y2": 163.51, "r_x3": 151.52, "r_y3": 163.51, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 182.54, "r_x1": 280.64, "r_y1": 182.54, "r_x2": 280.64, "r_y2": 174.47, "r_x3": 151.52, "r_y3": 174.47, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.08, "r_y0": 182.58, "r_x1": 478.03, "r_y1": 182.58, "r_x2": 478.03, "r_y2": 175.11, "r_x3": 285.08, "r_y3": 175.11, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.03, "r_y0": 182.54, "r_x1": 480.59, "r_y1": 182.54, "r_x2": 480.59, "r_y2": 174.47, "r_x3": 478.03, "r_y3": 174.47, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 193.54, "r_x1": 302.12, "r_y1": 193.54, "r_x2": 302.12, "r_y2": 186.07, "r_x3": 151.52, "r_y3": 186.07, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 4, "label": "list_item", "bbox": { "l": 134.76, "t": 196.39, "r": 480.59, "b": 215.41, "coord_origin": "TOPLEFT" }, "confidence": 0.953, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 204.46, "r_x1": 145.66, "r_y1": 204.46, "r_x2": 145.66, "r_y2": 196.39, "r_x3": 134.76, "r_y3": 196.39, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.92, "r_y0": 204.46, "r_x1": 480.59, "r_y1": 204.46, "r_x2": 480.59, "r_y2": 196.39, "r_x3": 149.92, "r_y3": 196.39, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 215.41, "r_x1": 318.55, "r_y1": 215.41, "r_x2": 318.55, "r_y2": 207.34, "r_x3": 151.52, "r_y3": 207.34, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.62, "r_y0": 215.21, "r_x1": 337.53, "r_y1": 215.21, "r_x2": 337.53, "r_y2": 207.28, "r_x3": 321.62, "r_y3": 207.28, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.53, "r_y0": 215.41, "r_x1": 399.47, "r_y1": 215.41, "r_x2": 399.47, "r_y2": 207.34, "r_x3": 337.53, "r_y3": 207.34, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 0, "label": "list_item", "bbox": { "l": 134.76, "t": 218.3, "r": 480.59, "b": 270.25, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 226.37, "r_x1": 145.72, "r_y1": 226.37, "r_x2": 145.72, "r_y2": 218.3, "r_x3": 134.76, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.01, "r_y0": 226.37, "r_x1": 480.59, "r_y1": 226.37, "r_x2": 480.59, "r_y2": 218.3, "r_x3": 150.01, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 237.33, "r_x1": 480.59, "r_y1": 237.33, "r_x2": 480.59, "r_y2": 229.26, "r_x3": 151.52, "r_y3": 229.26, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 248.29, "r_x1": 480.59, "r_y1": 248.29, "r_x2": 480.59, "r_y2": 240.22, "r_x3": 151.52, "r_y3": 240.22, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 259.25, "r_x1": 293.44, "r_y1": 259.25, "r_x2": 293.44, "r_y2": 251.18, "r_x3": 151.52, "r_y3": 251.18, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.05, "r_y0": 259.3, "r_x1": 480.59, "r_y1": 259.3, "r_x2": 480.59, "r_y2": 251.83, "r_x3": 297.05, "r_y3": 251.83, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 270.25, "r_x1": 175.05, "r_y1": 270.25, "r_x2": 175.05, "r_y2": 262.79, "r_x3": 151.52, "r_y3": 262.79, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 1, "label": "list_item", "bbox": { "l": 134.76, "t": 273.1, "r": 480.6, "b": 314.05, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 281.17, "r_x1": 146.37, "r_y1": 281.17, "r_x2": 146.37, "r_y2": 273.1, "r_x3": 134.76, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 281.17, "r_x1": 480.59, "r_y1": 281.17, "r_x2": 480.59, "r_y2": 273.1, "r_x3": 150.91, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 292.13, "r_x1": 480.59, "r_y1": 292.13, "r_x2": 480.59, "r_y2": 284.06, "r_x3": 151.52, "r_y3": 284.06, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 303.09, "r_x1": 480.6, "r_y1": 303.09, "r_x2": 480.6, "r_y2": 295.02, "r_x3": 151.52, "r_y3": 295.02, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 314.05, "r_x1": 236.02, "r_y1": 314.05, "r_x2": 236.02, "r_y2": 305.98, "r_x3": 151.52, "r_y3": 305.98, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, { "id": 2, "label": "list_item", "bbox": { "l": 134.76, "t": 316.93, "r": 480.59, "b": 346.92, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 325.0, "r_x1": 145.7, "r_y1": 325.0, "r_x2": 145.7, "r_y2": 316.93, "r_x3": 134.76, "r_y3": 316.93, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.97, "r_y0": 325.0, "r_x1": 480.59, "r_y1": 325.0, "r_x2": 480.59, "r_y2": 316.93, "r_x3": 149.97, "r_y3": 316.93, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 335.96, "r_x1": 480.59, "r_y1": 335.96, "r_x2": 480.59, "r_y2": 327.89, "r_x3": 151.52, "r_y3": 327.89, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 346.92, "r_x1": 335.14, "r_y1": 346.92, "r_x2": 335.14, "r_y2": 338.85, "r_x3": 151.52, "r_y3": 338.85, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] } ] }, "tablestructure": { "table_map": {} }, "figures_classification": null, "equations_prediction": null, "vlm_response": null }, "assembled": { "elements": [ { "label": "page_header", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 143.98, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.701, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" }, { "label": "page_header", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.82, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.789, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." }, { "label": "list_item", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 134.76, "t": 119.67, "r": 480.59, "b": 149.66, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.74, "r_x1": 146.08, "r_y1": 127.74, "r_x2": 146.08, "r_y2": 119.67, "r_x3": 134.76, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.51, "r_y0": 127.74, "r_x1": 480.59, "r_y1": 127.74, "r_x2": 480.59, "r_y2": 119.67, "r_x3": 150.51, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 138.7, "r_x1": 480.59, "r_y1": 138.7, "r_x2": 480.59, "r_y2": 130.63, "r_x3": 151.52, "r_y3": 130.63, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 149.66, "r_x1": 427.53, "r_y1": 149.66, "r_x2": 427.53, "r_y2": 141.59, "r_x3": 151.52, "r_y3": 141.59, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "18. Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruction network for table structure recognition. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. pp. 1295-1304 (2021)" }, { "label": "list_item", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.76, "t": 152.55, "r": 480.59, "b": 193.54, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 160.62, "r_x1": 146.19, "r_y1": 160.62, "r_x2": 146.19, "r_y2": 152.55, "r_x3": 134.76, "r_y3": 152.55, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.66, "r_y0": 160.62, "r_x1": 480.59, "r_y1": 160.62, "r_x2": 480.59, "r_y2": 152.55, "r_x3": 150.66, "r_y3": 152.55, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 171.58, "r_x1": 480.59, "r_y1": 171.58, "r_x2": 480.59, "r_y2": 163.51, "r_x3": 151.52, "r_y3": 163.51, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 182.54, "r_x1": 280.64, "r_y1": 182.54, "r_x2": 280.64, "r_y2": 174.47, "r_x3": 151.52, "r_y3": 174.47, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.08, "r_y0": 182.58, "r_x1": 478.03, "r_y1": 182.58, "r_x2": 478.03, "r_y2": 175.11, "r_x3": 285.08, "r_y3": 175.11, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.03, "r_y0": 182.54, "r_x1": 480.59, "r_y1": 182.54, "r_x2": 480.59, "r_y2": 174.47, "r_x3": 478.03, "r_y3": 174.47, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 193.54, "r_x1": 302.12, "r_y1": 193.54, "r_x2": 302.12, "r_y2": 186.07, "r_x3": 151.52, "r_y3": 186.07, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "19. Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup's solution for icdar 2021 competition on scientific literature parsing task b: Table recognition to html (2021). https://doi.org/10.48550/ARXIV.2105.01848 , https://arxiv.org/abs/2105.01848" }, { "label": "list_item", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 134.76, "t": 196.39, "r": 480.59, "b": 215.41, "coord_origin": "TOPLEFT" }, "confidence": 0.953, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 204.46, "r_x1": 145.66, "r_y1": 204.46, "r_x2": 145.66, "r_y2": 196.39, "r_x3": 134.76, "r_y3": 196.39, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.92, "r_y0": 204.46, "r_x1": 480.59, "r_y1": 204.46, "r_x2": 480.59, "r_y2": 196.39, "r_x3": 149.92, "r_y3": 196.39, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 215.41, "r_x1": 318.55, "r_y1": 215.41, "r_x2": 318.55, "r_y2": 207.34, "r_x3": 151.52, "r_y3": 207.34, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.62, "r_y0": 215.21, "r_x1": 337.53, "r_y1": 215.21, "r_x2": 337.53, "r_y2": 207.28, "r_x3": 321.62, "r_y3": 207.28, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.53, "r_y0": 215.41, "r_x1": 399.47, "r_y1": 215.41, "r_x2": 399.47, "r_y2": 207.34, "r_x3": 337.53, "r_y3": 207.34, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "20. Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table structure recognizer. Pattern Recognition 126 , 108565 (2022)" }, { "label": "list_item", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.76, "t": 218.3, "r": 480.59, "b": 270.25, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 226.37, "r_x1": 145.72, "r_y1": 226.37, "r_x2": 145.72, "r_y2": 218.3, "r_x3": 134.76, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.01, "r_y0": 226.37, "r_x1": 480.59, "r_y1": 226.37, "r_x2": 480.59, "r_y2": 218.3, "r_x3": 150.01, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 237.33, "r_x1": 480.59, "r_y1": 237.33, "r_x2": 480.59, "r_y2": 229.26, "r_x3": 151.52, "r_y3": 229.26, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 248.29, "r_x1": 480.59, "r_y1": 248.29, "r_x2": 480.59, "r_y2": 240.22, "r_x3": 151.52, "r_y3": 240.22, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 259.25, "r_x1": 293.44, "r_y1": 259.25, "r_x2": 293.44, "r_y2": 251.18, "r_x3": 151.52, "r_y3": 251.18, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.05, "r_y0": 259.3, "r_x1": 480.59, "r_y1": 259.3, "r_x2": 480.59, "r_y2": 251.83, "r_x3": 297.05, "r_y3": 251.83, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 270.25, "r_x1": 175.05, "r_y1": 270.25, "r_x2": 175.05, "r_y2": 262.79, "r_x3": 151.52, "r_y3": 262.79, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "21. Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vision (WACV). pp. 697-706 (2021). https://doi.org/10.1109/WACV48630.2021. 00074" }, { "label": "list_item", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 134.76, "t": 273.1, "r": 480.6, "b": 314.05, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 281.17, "r_x1": 146.37, "r_y1": 281.17, "r_x2": 146.37, "r_y2": 273.1, "r_x3": 134.76, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 281.17, "r_x1": 480.59, "r_y1": 281.17, "r_x2": 480.59, "r_y2": 273.1, "r_x3": 150.91, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 292.13, "r_x1": 480.59, "r_y1": 292.13, "r_x2": 480.59, "r_y2": 284.06, "r_x3": 151.52, "r_y3": 284.06, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 303.09, "r_x1": 480.6, "r_y1": 303.09, "r_x2": 480.6, "r_y2": 295.02, "r_x3": 151.52, "r_y3": 295.02, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 314.05, "r_x1": 236.02, "r_y1": 314.05, "r_x2": 236.02, "r_y2": 305.98, "r_x3": 151.52, "r_y3": 305.98, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "22. Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition: Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M. (eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Publishing, Cham (2020)" }, { "label": "list_item", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.76, "t": 316.93, "r": 480.59, "b": 346.92, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 325.0, "r_x1": 145.7, "r_y1": 325.0, "r_x2": 145.7, "r_y2": 316.93, "r_x3": 134.76, "r_y3": 316.93, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.97, "r_y0": 325.0, "r_x1": 480.59, "r_y1": 325.0, "r_x2": 480.59, "r_y2": 316.93, "r_x3": 149.97, "r_y3": 316.93, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 335.96, "r_x1": 480.59, "r_y1": 335.96, "r_x2": 480.59, "r_y2": 327.89, "r_x3": 151.52, "r_y3": 327.89, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 346.92, "r_x1": 335.14, "r_y1": 346.92, "r_x2": 335.14, "r_y2": 338.85, "r_x3": 151.52, "r_y3": 338.85, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "23. Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document layout analysis. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1015-1022. IEEE (2019)" } ], "body": [ { "label": "list_item", "id": 5, "page_no": 13, "cluster": { "id": 5, "label": "list_item", "bbox": { "l": 134.76, "t": 119.67, "r": 480.59, "b": 149.66, "coord_origin": "TOPLEFT" }, "confidence": 0.944, "cells": [ { "index": 3, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 127.74, "r_x1": 146.08, "r_y1": 127.74, "r_x2": 146.08, "r_y2": 119.67, "r_x3": 134.76, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "18.", "orig": "18.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 4, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.51, "r_y0": 127.74, "r_x1": 480.59, "r_y1": 127.74, "r_x2": 480.59, "r_y2": 119.67, "r_x3": 150.51, "r_y3": 119.67, "coord_origin": "TOPLEFT" }, "text": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "orig": "Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 5, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 138.7, "r_x1": 480.59, "r_y1": 138.7, "r_x2": 480.59, "r_y2": 130.63, "r_x3": 151.52, "r_y3": 130.63, "coord_origin": "TOPLEFT" }, "text": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "orig": "tion network for table structure recognition. In: Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 6, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 149.66, "r_x1": 427.53, "r_y1": 149.66, "r_x2": 427.53, "r_y2": 141.59, "r_x3": 151.52, "r_y3": 141.59, "coord_origin": "TOPLEFT" }, "text": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "orig": "International Conference on Computer Vision. pp. 1295-1304 (2021)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "18. Xue, W., Yu, B., Wang, W., Tao, D., Li, Q.: Tgrnet: A table graph reconstruction network for table structure recognition. In: Proceedings of the IEEE/CVF International Conference on Computer Vision. pp. 1295-1304 (2021)" }, { "label": "list_item", "id": 3, "page_no": 13, "cluster": { "id": 3, "label": "list_item", "bbox": { "l": 134.76, "t": 152.55, "r": 480.59, "b": 193.54, "coord_origin": "TOPLEFT" }, "confidence": 0.954, "cells": [ { "index": 7, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 160.62, "r_x1": 146.19, "r_y1": 160.62, "r_x2": 146.19, "r_y2": 152.55, "r_x3": 134.76, "r_y3": 152.55, "coord_origin": "TOPLEFT" }, "text": "19.", "orig": "19.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 8, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.66, "r_y0": 160.62, "r_x1": 480.59, "r_y1": 160.62, "r_x2": 480.59, "r_y2": 152.55, "r_x3": 150.66, "r_y3": 152.55, "coord_origin": "TOPLEFT" }, "text": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "orig": "Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup\u2019s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 9, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 171.58, "r_x1": 480.59, "r_y1": 171.58, "r_x2": 480.59, "r_y2": 163.51, "r_x3": 151.52, "r_y3": 163.51, "coord_origin": "TOPLEFT" }, "text": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "orig": "solution for icdar 2021 competition on scientific literature parsing task b: Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 10, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 182.54, "r_x1": 280.64, "r_y1": 182.54, "r_x2": 280.64, "r_y2": 174.47, "r_x3": 151.52, "r_y3": 174.47, "coord_origin": "TOPLEFT" }, "text": "ble recognition to html (2021).", "orig": "ble recognition to html (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 11, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 285.08, "r_y0": 182.58, "r_x1": 478.03, "r_y1": 182.58, "r_x2": 478.03, "r_y2": 175.11, "r_x3": 285.08, "r_y3": 175.11, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.48550/ARXIV.2105.01848", "orig": "https://doi.org/10.48550/ARXIV.2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 12, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 478.03, "r_y0": 182.54, "r_x1": 480.59, "r_y1": 182.54, "r_x2": 480.59, "r_y2": 174.47, "r_x3": 478.03, "r_y3": 174.47, "coord_origin": "TOPLEFT" }, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 13, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 193.54, "r_x1": 302.12, "r_y1": 193.54, "r_x2": 302.12, "r_y2": 186.07, "r_x3": 151.52, "r_y3": 186.07, "coord_origin": "TOPLEFT" }, "text": "https://arxiv.org/abs/2105.01848", "orig": "https://arxiv.org/abs/2105.01848", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "19. Ye, J., Qi, X., He, Y., Chen, Y., Gu, D., Gao, P., Xiao, R.: Pingan-vcgroup's solution for icdar 2021 competition on scientific literature parsing task b: Table recognition to html (2021). https://doi.org/10.48550/ARXIV.2105.01848 , https://arxiv.org/abs/2105.01848" }, { "label": "list_item", "id": 4, "page_no": 13, "cluster": { "id": 4, "label": "list_item", "bbox": { "l": 134.76, "t": 196.39, "r": 480.59, "b": 215.41, "coord_origin": "TOPLEFT" }, "confidence": 0.953, "cells": [ { "index": 14, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 204.46, "r_x1": 145.66, "r_y1": 204.46, "r_x2": 145.66, "r_y2": 196.39, "r_x3": 134.76, "r_y3": 196.39, "coord_origin": "TOPLEFT" }, "text": "20.", "orig": "20.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 15, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.92, "r_y0": 204.46, "r_x1": 480.59, "r_y1": 204.46, "r_x2": 480.59, "r_y2": 196.39, "r_x3": 149.92, "r_y3": 196.39, "coord_origin": "TOPLEFT" }, "text": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "orig": "Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 16, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 215.41, "r_x1": 318.55, "r_y1": 215.41, "r_x2": 318.55, "r_y2": 207.34, "r_x3": 151.52, "r_y3": 207.34, "coord_origin": "TOPLEFT" }, "text": "structure recognizer. Pattern Recognition", "orig": "structure recognizer. Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 17, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 321.62, "r_y0": 215.21, "r_x1": 337.53, "r_y1": 215.21, "r_x2": 337.53, "r_y2": 207.28, "r_x3": 321.62, "r_y3": 207.28, "coord_origin": "TOPLEFT" }, "text": "126", "orig": "126", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 18, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 337.53, "r_y0": 215.41, "r_x1": 399.47, "r_y1": 215.41, "r_x2": 399.47, "r_y2": 207.34, "r_x3": 337.53, "r_y3": 207.34, "coord_origin": "TOPLEFT" }, "text": ", 108565 (2022)", "orig": ", 108565 (2022)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "20. Zhang, Z., Zhang, J., Du, J., Wang, F.: Split, embed and merge: An accurate table structure recognizer. Pattern Recognition 126 , 108565 (2022)" }, { "label": "list_item", "id": 0, "page_no": 13, "cluster": { "id": 0, "label": "list_item", "bbox": { "l": 134.76, "t": 218.3, "r": 480.59, "b": 270.25, "coord_origin": "TOPLEFT" }, "confidence": 0.972, "cells": [ { "index": 19, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 226.37, "r_x1": 145.72, "r_y1": 226.37, "r_x2": 145.72, "r_y2": 218.3, "r_x3": 134.76, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "21.", "orig": "21.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 20, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.01, "r_y0": 226.37, "r_x1": 480.59, "r_y1": 226.37, "r_x2": 480.59, "r_y2": 218.3, "r_x3": 150.01, "r_y3": 218.3, "coord_origin": "TOPLEFT" }, "text": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "orig": "Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 21, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 237.33, "r_x1": 480.59, "r_y1": 237.33, "r_x2": 480.59, "r_y2": 229.26, "r_x3": 151.52, "r_y3": 229.26, "coord_origin": "TOPLEFT" }, "text": "(gte): A framework for joint table identification and cell structure recognition using", "orig": "(gte): A framework for joint table identification and cell structure recognition using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 22, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 248.29, "r_x1": 480.59, "r_y1": 248.29, "r_x2": 480.59, "r_y2": 240.22, "r_x3": 151.52, "r_y3": 240.22, "coord_origin": "TOPLEFT" }, "text": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "orig": "visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 23, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 259.25, "r_x1": 293.44, "r_y1": 259.25, "r_x2": 293.44, "r_y2": 251.18, "r_x3": 151.52, "r_y3": 251.18, "coord_origin": "TOPLEFT" }, "text": "sion (WACV). pp. 697-706 (2021).", "orig": "sion (WACV). pp. 697-706 (2021).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 24, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 297.05, "r_y0": 259.3, "r_x1": 480.59, "r_y1": 259.3, "r_x2": 480.59, "r_y2": 251.83, "r_x3": 297.05, "r_y3": 251.83, "coord_origin": "TOPLEFT" }, "text": "https://doi.org/10.1109/WACV48630.2021.", "orig": "https://doi.org/10.1109/WACV48630.2021.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 25, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 270.25, "r_x1": 175.05, "r_y1": 270.25, "r_x2": 175.05, "r_y2": 262.79, "r_x3": 151.52, "r_y3": 262.79, "coord_origin": "TOPLEFT" }, "text": "00074", "orig": "00074", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "21. Zheng, X., Burdick, D., Popa, L., Zhong, X., Wang, N.X.R.: Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. In: 2021 IEEE Winter Conference on Applications of Computer Vision (WACV). pp. 697-706 (2021). https://doi.org/10.1109/WACV48630.2021. 00074" }, { "label": "list_item", "id": 1, "page_no": 13, "cluster": { "id": 1, "label": "list_item", "bbox": { "l": 134.76, "t": 273.1, "r": 480.6, "b": 314.05, "coord_origin": "TOPLEFT" }, "confidence": 0.969, "cells": [ { "index": 26, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 281.17, "r_x1": 146.37, "r_y1": 281.17, "r_x2": 146.37, "r_y2": 273.1, "r_x3": 134.76, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "22.", "orig": "22.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 27, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 150.91, "r_y0": 281.17, "r_x1": 480.59, "r_y1": 281.17, "r_x2": 480.59, "r_y2": 273.1, "r_x3": 150.91, "r_y3": 273.1, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "orig": "Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 28, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 292.13, "r_x1": 480.59, "r_y1": 292.13, "r_x2": 480.59, "r_y2": 284.06, "r_x3": 151.52, "r_y3": 284.06, "coord_origin": "TOPLEFT" }, "text": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "orig": "Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 29, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 303.09, "r_x1": 480.6, "r_y1": 303.09, "r_x2": 480.6, "r_y2": 295.02, "r_x3": 151.52, "r_y3": 295.02, "coord_origin": "TOPLEFT" }, "text": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "orig": "(eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 30, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 314.05, "r_x1": 236.02, "r_y1": 314.05, "r_x2": 236.02, "r_y2": 305.98, "r_x3": 151.52, "r_y3": 305.98, "coord_origin": "TOPLEFT" }, "text": "lishing, Cham (2020)", "orig": "lishing, Cham (2020)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "22. Zhong, X., ShafieiBavani, E., Jimeno Yepes, A.: Image-based table recognition: Data, model, and evaluation. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.M. (eds.) Computer Vision - ECCV 2020. pp. 564-580. Springer International Publishing, Cham (2020)" }, { "label": "list_item", "id": 2, "page_no": 13, "cluster": { "id": 2, "label": "list_item", "bbox": { "l": 134.76, "t": 316.93, "r": 480.59, "b": 346.92, "coord_origin": "TOPLEFT" }, "confidence": 0.967, "cells": [ { "index": 31, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 325.0, "r_x1": 145.7, "r_y1": 325.0, "r_x2": 145.7, "r_y2": 316.93, "r_x3": 134.76, "r_y3": 316.93, "coord_origin": "TOPLEFT" }, "text": "23.", "orig": "23.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 32, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 149.97, "r_y0": 325.0, "r_x1": 480.59, "r_y1": 325.0, "r_x2": 480.59, "r_y2": 316.93, "r_x3": 149.97, "r_y3": 316.93, "coord_origin": "TOPLEFT" }, "text": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "orig": "Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 33, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 335.96, "r_x1": 480.59, "r_y1": 335.96, "r_x2": 480.59, "r_y2": 327.89, "r_x3": 151.52, "r_y3": 327.89, "coord_origin": "TOPLEFT" }, "text": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "orig": "out analysis. In: 2019 International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 34, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 151.52, "r_y0": 346.92, "r_x1": 335.14, "r_y1": 346.92, "r_x2": 335.14, "r_y2": 338.85, "r_x3": 151.52, "r_y3": 338.85, "coord_origin": "TOPLEFT" }, "text": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "orig": "nition (ICDAR). pp. 1015-1022. IEEE (2019)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "23. Zhong, X., Tang, J., Yepes, A.J.: Publaynet: largest dataset ever for document layout analysis. In: 2019 International Conference on Document Analysis and Recognition (ICDAR). pp. 1015-1022. IEEE (2019)" } ], "headers": [ { "label": "page_header", "id": 7, "page_no": 13, "cluster": { "id": 7, "label": "page_header", "bbox": { "l": 134.76, "t": 93.77, "r": 143.98, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.701, "cells": [ { "index": 0, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 134.76, "r_y0": 101.84, "r_x1": 143.98, "r_y1": 101.84, "r_x2": 143.98, "r_y2": 93.77, "r_x3": 134.76, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "14" }, { "label": "page_header", "id": 6, "page_no": 13, "cluster": { "id": 6, "label": "page_header", "bbox": { "l": 167.82, "t": 93.77, "r": 231.72, "b": 101.84, "coord_origin": "TOPLEFT" }, "confidence": 0.789, "cells": [ { "index": 1, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 167.82, "r_y0": 101.84, "r_x1": 178.08, "r_y1": 101.84, "r_x2": 178.08, "r_y2": 93.77, "r_x3": 167.82, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "M.", "orig": "M.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false }, { "index": 2, "rgba": { "r": 0, "g": 0, "b": 0, "a": 255 }, "rect": { "r_x0": 182.38, "r_y0": 101.84, "r_x1": 231.72, "r_y1": 101.84, "r_x2": 231.72, "r_y2": 93.77, "r_x3": 182.38, "r_y3": 93.77, "coord_origin": "TOPLEFT" }, "text": "Lysak, et al.", "orig": "Lysak, et al.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false } ], "children": [] }, "text": "M. Lysak, et al." } ] } } ]